changeset 7:aaefa93c2dd2 draft

"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mafft commit eff9db2cd18c82a7de37851571b8989b48014c71"
author rnateam
date Wed, 15 Apr 2020 15:33:37 -0400
parents c5908940967d
children 4de39704d423
files macros.xml mafft-add.xml mafft.xml test-data/add_seq.fa test-data/mafft_add_result.aln test-data/mafft_custom_result.aln test-data/mafft_fftns_result.aln test-data/mafft_nwns_result.aln
diffstat 8 files changed, 2173 insertions(+), 1137 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml	Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,16 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<macros>
+    <token name="@VERSION@">1</token> <!-- wrapper revision, appended to the tool version as the +galaxy suffix -->
+    <token name="@TOOL_VERSION@">7.455</token> <!-- MAFFT release; shared by the tool version and the package requirement -->
+    <xml name="requirements">
+      <requirements>
+          <requirement type="package" version="@TOOL_VERSION@">mafft</requirement>
+          <requirement type="package" version="36.3.8">fasta3</requirement> <!-- mafft.xml looks up fasta36 for the fastapair method -->
+      </requirements>
+    </xml>
+    <xml name="citations">
+      <citations>
+          <citation type="doi">10.1093/molbev/mst010</citation>
+      </citations>
+    </xml>
+</macros>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/mafft-add.xml	Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,88 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<tool id="rbc_mafft_add" name="MAFFT add" version="@TOOL_VERSION@+galaxy@VERSION@">
+  <description>Align a sequence, alignment or fragments to an existing alignment.</description>
+  <macros>
+    <import>macros.xml</import>
+  </macros>
+  <expand macro="requirements" />
+  <stdio>
+    <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />
+    <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
+  </stdio>
+  <version_command>    <![CDATA[
+    mafft --version
+    ]]>
+  </version_command>
+  <command>
+    <![CDATA[
+      mafft
+      #if $sequences.sequenceType == 'singleseq'
+        $sequences.preservegap  '$inputSequences'
+      #elif $sequences.sequenceType == 'frags'
+        --addfragments '$inputSequences'
+      #elif $sequences.sequenceType == 'group'
+        --addprofile '$inputSequences'
+      #end if
+      $keeplength $map $reorder
+      '$inputAlignment'
+      > '$outputAlignment'
+      #if $map == '--mapout'
+        && mv '${inputSequences}.map' '$outputmap'
+      #end if
+    ]]>
+  </command> <!-- Runs mafft with the add/seed, addfragments or addprofile flag chosen by the sequences conditional, appends the keeplength, map and reorder flags, writes stdout to outputAlignment and, when the map flag is set, moves the inputSequences .map file to outputmap. -->
+  <inputs>
+    <param name="inputSequences" type="data" format="fasta" label="Sequences to add to the alignment" help="Amino acid or nucleotide sequences in FASTA format."/>
+    <param name="inputAlignment" type="data" format="fasta" label="Alignment" help="Amino acid or nucleotide sequences in aligned FASTA format."/>
+    <conditional name="sequences"> <!-- selects which mafft add-mode flag the command template emits -->
+      <param name="sequenceType" type="select" label="What do you want to add to the alignment" >
+        <option value="singleseq">A single sequence</option>
+        <option value="frags" selected="true">Fragments</option>
+        <option value="group">An alignment</option>
+      </param>
+      <when value="singleseq">
+        <param name="preservegap" type="select" label="Preserve the original alignment" help="Keep the given alignment unchanged (--add). If not, the aligned letters in the seed alignment are preserved but gaps are not necessarily preserved (--seed).">
+          <option value="--add" selected="true">Yes</option>
+          <option value="--seed">No</option>
+        </param>
+      </when>
+      <when value="frags"/>
+      <when value="group"/>
+    </conditional>
+    <param name="keeplength" type="boolean" truevalue="--keeplength" falsevalue="" checked="True" label="Keep alignment length" help="The alignment length is unchanged.  Insertions at the additional sequences are deleted" />
+    <param name="map" type="boolean" truevalue="--mapout" falsevalue="" checked="False" label="Output a correspondence table of positions (--mapout)" help="Output a correspondence table of positions, sequence.map, between before and after the calculation.  The --mapout option automatically turns on the --keeplength option, to keep the numbering of sites in the reference alignment" />
+    <param name="reorder" type="boolean" truevalue="" falsevalue="--reorder" checked="True" label="Preserve the original order of sequences (uncheck to pass --reorder)" /> <!-- inverted boolean: the flag is emitted only when unchecked -->
+  </inputs>
+  <outputs>
+    <data format="fasta" name="outputAlignment" label="${tool.name} on ${on_string} : New alignment"/>
+    <data name="outputmap" format="tabular" label="${tool.name} on ${on_string} : Correspondence of positions"> <!-- only created when the map option is checked -->
+      <filter>map == True</filter>
+    </data>
+  </outputs>
+  <tests>
+    <test expect_num_outputs="1" > <!-- one sequence added in add mode, length kept, no map output -->
+      <param name="inputSequences" value="add_seq.fa"/>
+      <param name="inputAlignment" value="mafft_fftns_result.aln"/>
+      <param name="sequenceType" value="singleseq"/>
+      <param name="preservegap" value="--add"/>
+      <param name="keeplength" value="true"/>
+      <param name="map" value="false"/>
+      <output name="outputAlignment" ftype="fasta" file="mafft_add_result.aln"/>
+    </test>
+  </tests>
+  <help>
+    <![CDATA[
+Add one or more sequences to an existing alignment. The new sequence(s) can be complete, fragments, or another alignment.
+
+- Sequences in new_sequences are ungapped and then aligned to existing_alignment.
+- new_sequences is a single multi-FASTA format file.
+- existing_alignment is a single multi-FASTA format file.
+- Gaps in existing_alignment are preserved by default (--add), but it can be deactivated (--seed). In that case the aligned letters in the seed alignment are preserved but gaps are not necessarily preserved.
+- The alignment length may be conserved if the --keeplength option is given. The alignment length is unchanged.  Insertions at the new sequences are deleted.
+- --mapout options output a correspondence table of positions, new_sequences.map, between before and after the calculation.  The --mapout option automatically turns on the --keeplength option, to keep the numbering of sites in the reference alignment.
+- Omit --reorder to preserve the original sequence order.
+
+    ]]>
+  </help>
+  <expand macro="citations" />
+</tool>
--- a/mafft.xml	Sat Nov 11 15:06:34 2017 -0500
+++ b/mafft.xml	Wed Apr 15 15:33:37 2020 -0400
@@ -1,229 +1,294 @@
-<tool id="rbc_mafft" name="MAFFT" version="7.221.3">
-    <description>Multiple alignment program for amino acid or nucleotide sequences</description>
-    <requirements>
-        <requirement type="package" version="7.221">mafft</requirement>
-    </requirements>
-    <stdio>
-        <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />
-        <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
-    </stdio>
-    <version_command>
-    <![CDATA[
-        mafft --version
-    ]]>
-    </version_command>
-    <command>
-    <![CDATA[
-        #if $cond_flavour.flavourType != 'custom'
-            $cond_flavour.flavourType
-        #elif $cond_flavour.flavourType == 'custom'
-            ### full parameter options
-            mafft
-            $cond_flavour.distance_method
-            --retree $cond_flavour.retree
-            --maxiterate $cond_flavour.iterations
-        #end if
-
-        ## specify threads to use
-        --thread \${GALAXY_SLOTS:-1}
-
-        $datatype
-        --ep $ep
-        --op $op
-        $adjustdirection
-        
-        #if $matrix_condition.matrix == "BLOSUM"
-          --bl ${matrix_condition.BLOSUM}
-        #elif $matrix_condition.matrix == "PAM"
-           --jtt ${matrix_condition.PAM}
-        #end if
-
-        $reorder
-        $getTree
-        $outputFormat
-        $inputSequences > $outputAlignment;
-
-        #if $getTree == "--treeout"
-            mv ${inputSequences}.tree $outputTree;
-        #end if
-    ]]>
-    </command>
-    <inputs>
-        <param name="inputSequences" type="data" format="fasta" label="Sequences to align" help="Amino acid or nucleotide sequences in FASTA format."/>
-        <param name="datatype" type="select" label="Data type">
-            <option value="">Auto detection</option>
-            <option value="--nuc">Nucleic acids</option>
-            <option value="--amino">Amino acids</option>
-        </param>
-        <conditional name="cond_flavour">
-            <param name="flavourType" type="select" label="MAFFT flavour" help="Run mafft with pre-defined input parameters. Specification of these parameters can be found in the help section.">
-                <option value="mafft --auto">auto</option>
-                <option value="mafft-fftns" selected="true">fftns</option>
-                <option value="mafft-fftnsi">fftnsi</option>
-                <option value="mafft-nwns">nwns</option>
-                <option value="mafft-nwnsi">nwnsi</option>
-                <option value="mafft-einsi">einsi</option>
-                <option value="mafft-ginsi">ginsi</option>
-                <option value="mafft-linsi">linsi</option>
-                <option value="mafft-qinsi">qinsi</option>
-                <option value="mafft-xinsi">xinsi</option>
-                <option value="custom">Custom Parameters</option>
-            </param>
-            <when value="mafft-fftns"/>
-            <when value="mafft --auto"/>
-            <when value="mafft-fftnsi"/>
-            <when value="mafft-nwns"/>
-            <when value="mafft-nwnsi"/>
-            <when value="mafft-einsi"/>
-            <when value="mafft-ginsi"/>
-            <when value="mafft-linsi"/>
-            <when value="mafft-qinsi"/>
-            <when value="mafft-xinsi"/>
-            <when value="custom">
-                <param name="distance_method" type="select" display="radio" label="Distance method" help="Distance method must be chosen regarding your data">
-                    <option value="--6merpair" selected="true">Shared 6mers distance (fastest)</option>
-                    <option value="--globalpair">Global alignment (Needleman-Wunsch)</option>
-                    <option value="--localpair">Local alignment (Smith-Waterman)</option>
-                    <option value="--genafpair">Local, affine gap cost</option>
-                </param>
-                <param name="retree" type="integer" value="2" min="1" max="100" label="Guide tree is built this number of times in the progressive stage." help="Valid with 6mer distance" />
-                <param name="iterations" type="integer" value="0" min="0" max="1000" label="Maximum number of iterations" help="1000 for maximum quality" />
-            </when>
-        </conditional>
-        <param name="ep" type="float" value="0.123" label="Gap extend penalty" help="Offset value, which works like gap extension penalty, for group-to-group alignment. For E-INS-i, 0 is recommended to allow large gaps" />
-        <param name="op" type="float" value="1.53" label="Gap opening penalty" help="1.53 default value" />
-        <param name="adjustdirection" type="select" display="radio" label="Direction of nucleotide sequences" help="Generate reverse complement sequences, as necessary, and align them together with the remaining sequences">
-            <option value="--adjustdirection">adjust direction</option>
-            <option value=" " selected="true">do not adjust direction</option>
-        </param>
-        <conditional name="matrix_condition">
-            <param name="matrix" type="select" label="Matrix selection" display="radio" help="Usefull only for amino acids" >
-                <option value="">No matrix</option>
-                <option value="BLOSUM">BLOSUM</option>
-                <option value="PAM">PAM</option>
-            </param>
-            <when value=""/>
-            <when value="BLOSUM">
-                <param name="BLOSUM" type="select" display="radio" label="Coefficient of the BLOSUM matrix">
-                    <option value="30">30</option>
-                    <option value="45">45</option>
-                    <option value="62" selected="true">62</option>
-                    <option value="80">80</option>
-                </param>
-            </when>
-            <when value="PAM">
-                <param name="PAM" type="integer" value="80" min="1" max="350" label="Coefficient of the PAM matrix" />
-            </when>
-        </conditional>
-        <param name="reorder" type="boolean" truevalue="--reorder" falsevalue="" checked="False" label="Reorder output?" />
-        <param name="getTree" type="boolean" truevalue="--treeout" falsevalue="" checked="False" label="Display alignment tree ?" />
-        <param name="outputFormat" type="select" label="Output format" help="Either FASTA or ClustalW">
-            <option value="" selected="true">FASTA</option>
-            <option value="--clustalout">ClustalW</option>
-            <option value="--phylipout">Phylip</option>
-        </param>
-    </inputs>
-    <outputs>
-        <data format="fasta" name="outputAlignment" label="${tool.name} on ${on_string}">
-            <change_format>
-                <when input="outputFormat" value="--clustalout" format="clustal"/>
-                <when input="outputFormat" value="--phylipout" format="phylip"/>
-            </change_format>
-        </data>
-        <data name="outputTree" format="txt" label="${tool.name} Guide Tree">
-            <filter>getTree == True</filter>
-        </data>
-    </outputs>
-    <tests>
-        <test>
-            <param name="inputSequences" value="sample.fa"/>
-            <param name="flavourType" value="mafft-fftns"/>
-            <param name="outputFormat" value=""/>
-            <output name="outputAlignment" ftype="fasta" file="mafft_fftns_result.aln"/>
-        </test>
-        <test>
-            <param name="inputSequences" value="sample.fa"/>
-            <param name="flavourType" value="mafft-nwns"/>
-            <param name="outputFormat" value="--clustalout"/>
-            <output name="outputAlignment" ftype="clustal" file="mafft_nwns_result.aln"/>
-        </test>
-    </tests>
-    <help>
-    <![CDATA[
-**What it does**
-
-MAFFT is a multiple sequence alignment program for unix-like operating systems.  
-It offers a range of multiple alignment methods, L-INS-i (accurate; for alignment of <∼200 sequences), 
-FFT-NS-2 (fast; for alignment of <∼30,000 sequences), etc.
-
-From the MAFFT man page, an overview of the different predefined flavours of the tool.
-
-**Accuracy-oriented methods:**
-
-- L-INS-i (probably most accurate; recommended for <200 sequences; iterative refinement method incorporating local pairwise alignment information):
-    
-    - mafft --localpair --maxiterate 1000 input [> output]
-
-- G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information):
-    
-    - mafft --globalpair --maxiterate 1000 input [> output]
-
-- E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences):
-    
-    - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps. 
-
-
-**Speed-oriented methods:**
-
-- FFT-NS-i (iterative refinement method; two cycles only):
-
-    - mafft --retree 2 --maxiterate 2 input [> output]
-
-- FFT-NS-i (iterative refinement method; max. 1000 iterations):
-
-    - mafft --retree 2 --maxiterate 1000 input [> output]
-
-- FFT-NS-2 (fast; progressive method):
-
-    - mafft --retree 2 --maxiterate 0 input [> output]
-
-- FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree):
-
-    - mafft --retree 1 --maxiterate 0 input [> output]
-
-- NW-NS-i (iterative refinement method without FFT approximation; two cycles only):
-
-    - mafft --retree 2 --maxiterate 2 --nofft input [> output]
-
-- NW-NS-2 (fast; progressive method without the FFT approximation):
-
-    - mafft --retree 2 --maxiterate 0 --nofft input [> output]
-
-- NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm):
-
-    - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output]
-
-**Options:**
-
---auto
-    Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
---adjustdirection
-    Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored.
---op
-    Gap opening penalty, default: 1.53
---ep
-    Offset (works like gap extension penalty), default: 0.0
---maxiterate
-    Maximum number of iterative refinement, default: 0
---clustalout
-    Output: clustal format, default: fasta
---thread
-    Number of threads (if unsure, --thread -1)
---retree number
-    Guide tree is built number times in the progressive stage.  Valid with 6mer distance.  Default: 2
-    ]]>
-    </help>
-    <citations>
-        <citation type="doi">10.1093/molbev/mst010</citation>
-    </citations>
-</tool>
+<?xml version="1.0" encoding="UTF-8"?>
+<tool id="rbc_mafft" name="MAFFT" version="@TOOL_VERSION@+galaxy@VERSION@">
+  <description>Multiple alignment program for amino acid or nucleotide sequences</description>
+  <macros>
+    <import>macros.xml</import>
+  </macros>
+  <expand macro="requirements" />
+  <stdio>
+    <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" />
+    <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" />
+  </stdio>
+  <version_command>    <![CDATA[
+    mafft --version
+    ]]>
+  </version_command>
+  <command>
+    <![CDATA[
+      ## the fastapair method needs the location of the fasta36 binary in FASTA_4_MAFFT
+      #if $cond_flavour.flavourType == 'custom'
+        #if $cond_flavour.dist_flavour.distance_method == '--fastapair'
+          export FASTA_4_MAFFT=`which fasta36`;
+        #end if
+      #end if
+      ## a predefined flavour is used verbatim as the executable; 'custom' assembles the flags below
+      #if $cond_flavour.flavourType != 'custom'
+        $cond_flavour.flavourType
+      #elif $cond_flavour.flavourType == 'custom'
+        ### full parameter options
+        mafft
+        $cond_flavour.dist_flavour.distance_method
+        #if $cond_flavour.dist_flavour.distance_method == '--6merpair'
+          --retree $cond_flavour.dist_flavour.retree
+          $cond_flavour.dist_flavour.usetree.parttree
+          #if $cond_flavour.dist_flavour.usetree.parttree == '--parttree'
+            $cond_flavour.dist_flavour.usetree.treedistance
+            --partsize $cond_flavour.dist_flavour.usetree.partsize
+            #if str($cond_flavour.dist_flavour.usetree.groupsize).strip()
+              --groupsize $cond_flavour.dist_flavour.usetree.groupsize
+            #end if
+          #end if
+        #elif $cond_flavour.dist_flavour.distance_method == '--globalpair'
+          --weighti $cond_flavour.dist_flavour.weighti
+        #elif $cond_flavour.dist_flavour.distance_method == '--localpair'
+          --weighti $cond_flavour.dist_flavour.weighti
+          --lop $cond_flavour.dist_flavour.lop
+          --lep $cond_flavour.dist_flavour.lep
+          --lexp $cond_flavour.dist_flavour.lexp
+        #elif $cond_flavour.dist_flavour.distance_method == '--genafpair'
+          --weighti $cond_flavour.dist_flavour.weighti
+          --lop $cond_flavour.dist_flavour.lop
+          --lep $cond_flavour.dist_flavour.lep
+          --lexp $cond_flavour.dist_flavour.lexp
+          --LOP $cond_flavour.dist_flavour.skipLOP
+          --LEXP $cond_flavour.dist_flavour.skipEXP
+        #elif $cond_flavour.dist_flavour.distance_method == '--fastapair'
+          --weighti $cond_flavour.dist_flavour.weighti
+        #end if
+        --maxiterate $cond_flavour.iterations
+        $cond_flavour.fft
+        $cond_flavour.score
+      #end if
+
+      ## specify threads to use
+      --thread \${GALAXY_SLOTS:-1}
+      $datatype
+      --ep $ep
+      --op $op
+      ## scoring matrix; NOTE(review): the PAM branch passes both --jtt and --tm, confirm which one mafft honours
+      #if $matrix_condition.matrix == "BLOSUM"
+        --bl $matrix_condition.BLOSUM
+      #elif $matrix_condition.matrix == "PAM"
+        --jtt $matrix_condition.PAM
+        --tm $matrix_condition.tm
+      #elif $matrix_condition.matrix == "custom"
+        --aamatrix  '$matrix_condition.matrixfile'
+        $matrix_condition.fmodel
+      #end if
+
+      $reorder
+      $getTree
+      $outputFormat
+      '$inputSequences' > '$outputAlignment'
+      ## the guide tree is moved only if the alignment itself succeeded
+      #if $getTree == "--treeout"
+        && mv '${inputSequences}.tree' '$outputTree'
+      #end if
+    ]]>
+  </command>
+  <inputs>
+    <param name="inputSequences" type="data" format="fasta" label="Sequences to align" help="Amino acid or nucleotide sequences in FASTA format."/>
+    <param name="datatype" type="select" label="Data type">
+      <option value="">Auto detection</option>
+      <option value="--nuc">Nucleic acids</option>
+      <option value="--amino">Amino acids</option>
+    </param>
+    <conditional name="cond_flavour">
+      <param name="flavourType" type="select" label="MAFFT flavour" help="Run mafft with pre-defined input parameters. Specification of these parameters can be found in the help section.">
+        <option value="mafft --auto">auto</option>
+        <option value="mafft-fftns" selected="true">fftns</option>
+        <option value="mafft-fftnsi">fftnsi</option>
+        <option value="mafft-nwns">nwns</option>
+        <option value="mafft-nwnsi">nwnsi</option>
+        <option value="mafft-einsi">einsi</option>
+        <option value="mafft-ginsi">ginsi</option>
+        <option value="mafft-linsi">linsi</option>
+        <option value="mafft-qinsi">qinsi</option>
+        <option value="mafft-xinsi">xinsi</option>
+        <option value="custom">Custom Parameters</option>
+      </param>
+      <when value="mafft-fftns"/>
+      <when value="mafft --auto"/>
+      <when value="mafft-fftnsi"/>
+      <when value="mafft-nwns"/>
+      <when value="mafft-nwnsi"/>
+      <when value="mafft-einsi"/>
+      <when value="mafft-ginsi"/>
+      <when value="mafft-linsi"/>
+      <when value="mafft-qinsi"/>
+      <when value="mafft-xinsi"/>
+      <when value="custom"> <!-- only this branch exposes parameters; the command template reads them as cond_flavour.* -->
+        <conditional name="dist_flavour">
+          <param name="distance_method" type="select" display="radio" label="Distance method" help="Distance method must be chosen regarding your data">
+            <option value="--6merpair" selected="true">Shared 6mers distance (fastest)</option>
+            <option value="--globalpair">Global alignment (Needleman-Wunsch)</option>
+            <option value="--localpair">Local alignment (Smith-Waterman)</option>
+            <option value="--genafpair">Local, affine gap cost</option>
+            <option value="--fastapair">All pairwise alignments are computed with FASTA</option>
+          </param>
+          <when value="--6merpair">
+            <param name="retree" type="integer" value="2" min="1" max="100" label="Guide tree is built this number of times in the progressive stage." help="Valid with 6mer distance" />
+            <conditional name="usetree">
+              <param name="parttree" type="select" label="Use a fast tree-building method?" help="Recommended when a large number (> ~10,000) of sequences are input" >
+                <option value="--parttree" selected="true">Yes</option>
+                <option value="">No</option>
+              </param>
+              <when value="--parttree">
+                <param name="treedistance" type="select" display="radio" label="Distance method" help="Distance method must be chosen regarding your data">
+                  <option value="--fastaparttree" selected="true">Distances based on FASTA</option>
+                  <option value="--dpparttree">Distances based on DP. (Needleman-Wunsch)</option>
+                </param>
+                <param name="partsize" type="integer" value="50" min="0" max="1000" label="Number of partitions in the PartTree algorithm" />
+                <param name="groupsize" type="integer" value="" optional="true" min="0" max="1000" label="Do not make alignment larger than ... sequences" help="Leave empty to let MAFFT use its own default." /> <!-- optional because the default is empty -->
+              </when>
+              <when value=""/>
+            </conditional>
+          </when>
+          <when value="--globalpair">
+            <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." />
+          </when>
+          <when value="--localpair">
+            <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." />
+            <param name="lop" type="float" value="-2.0" label="Gap opening penalty at local pairwise alignment" help="-2.00 default value" />
+            <param name="lep" type="float" value="0.1" label="Offset value at local pairwise alignment" help="0.1 default value" />
+            <param name="lexp" type="float" value="-0.1" label="Gap extension penalty at local pairwise alignment." help="-0.1 default value" />
+          </when>
+          <when value="--genafpair">
+            <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." />
+            <param name="lop" type="float" value="-2.0" label="Gap opening penalty at local pairwise alignment" help="-2.00 default value" />
+            <param name="lep" type="float" value="0.1" label="Offset value at local pairwise alignment" help="0.1 default value" />
+            <param name="lexp" type="float" value="-0.1" label="Gap extension penalty at local pairwise alignment." help="-0.1 default value" />
+            <param name="skipLOP" type="float" value="-6.00" label="Gap opening penalty to skip the alignment" help="-6.00 default value" />
+            <param name="skipEXP" type="float" value="0.00" label="Gap extension penalty to skip the alignment" help="0 default value" />
+          </when>
+          <when value="--fastapair">
+            <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." />
+          </when>
+        </conditional>
+        <param name="iterations" type="integer" value="0" min="0" max="1000" label="Maximum number of iterations" help="1000 for maximum quality" />
+        <param name="fft" type="boolean" truevalue="--fft" falsevalue="--nofft" checked="True" label="Use FFT approximation in group-to-group alignment?" />
+        <param name="score" type="boolean" truevalue="" falsevalue="--noscore" checked="True" label="Check alignment score in the iterative refinement stage?" />
+      </when>
+    </conditional>
+    <param name="ep" type="float" value="0.0" label="Gap extend penalty for group-to-group alignment" help="Offset value, which works like gap extension penalty, for group-to-group alignment. For E-INS-i, 0 is recommended to allow large gaps" />
+    <param name="op" type="float" value="1.53" label="Gap opening penalty at group-to-group alignment." help="1.53 default value" />
+    <conditional name="matrix_condition">
+      <param name="matrix" type="select" label="Matrix selection" display="radio" help="Useful only for amino acids" >
+        <option value="">No matrix</option>
+        <option value="BLOSUM" selected="true">BLOSUM</option>
+        <option value="PAM">PAM</option>
+        <option value="custom">Custom</option>
+      </param>
+      <when value=""/>
+      <when value="BLOSUM">
+        <param name="BLOSUM" type="select" display="radio" label="Coefficient of the BLOSUM matrix">
+          <option value="30">30</option>
+          <option value="45">45</option>
+          <option value="62" selected="true">62</option>
+          <option value="80">80</option>
+        </param>
+      </when>
+      <when value="PAM">
+        <param name="PAM" type="integer" value="80" min="1" max="350" label="Coefficient of the JTT PAM matrix" />
+        <param name="tm" type="integer" value="80" min="1" max="350" label="Coefficient of the transmembrane PAM matrix" />
+      </when>
+      <when value="custom">
+        <param name="matrixfile" type="data" format="txt" label="User-defined AA scoring matrix" help="The format of matrixfile is the same to that of BLAST. Ignored when nucleotide sequences are input."/>
+        <param name="fmodel" type="boolean" truevalue="--fmodel" falsevalue="" checked="False" label="Incorporate the AA/nuc composition information into the scoring matrix?" />
+      </when>
+    </conditional>
+    <param name="reorder" type="boolean" truevalue="--reorder" falsevalue="" checked="False" label="Reorder output?" />
+    <param name="getTree" type="boolean" truevalue="--treeout" falsevalue="" checked="False" label="Display alignment tree ?" />
+    <param name="outputFormat" type="select" label="Output format" help="FASTA, ClustalW or Phylip">
+      <option value="" selected="true">FASTA</option>
+      <option value="--clustalout">ClustalW</option>
+      <option value="--phylipout">Phylip</option>
+    </param>
+  </inputs>
+  <outputs>
+    <data name="outputAlignment" format="fasta" label="${tool.name} on ${on_string}"> <!-- alignment; datatype switches with the outputFormat select -->
+      <change_format>
+        <when input="outputFormat" value="--clustalout" format="clustal" />
+        <when input="outputFormat" value="--phylipout" format="phylip" />
+      </change_format>
+    </data>
+    <data name="outputTree" label="${tool.name} Guide Tree" format="txt"> <!-- kept only when getTree is checked -->
+      <filter>getTree == True</filter>
+    </data>
+  </outputs>
+  <tests>
+    <test expect_num_outputs="1" > <!-- default fftns flavour, FASTA output -->
+      <param name="inputSequences" value="sample.fa"/>
+      <param name="flavourType" value="mafft-fftns"/>
+      <param name="outputFormat" value=""/>
+      <output name="outputAlignment" ftype="fasta" file="mafft_fftns_result.aln"/>
+    </test>
+    <test expect_num_outputs="1" > <!-- nwns flavour, Clustal output -->
+      <param name="inputSequences" value="sample.fa"/>
+      <param name="flavourType" value="mafft-nwns"/>
+      <param name="outputFormat" value="--clustalout"/>
+      <output name="outputAlignment" ftype="clustal" file="mafft_nwns_result.aln"/>
+    </test>
+    <test expect_num_outputs="1" > <!-- custom flavour with the fastapair method; matrix is the select inside matrix_condition -->
+      <param name="inputSequences" value="sample.fa"/>
+      <param name="flavourType" value="custom"/>
+      <param name="matrix" value="BLOSUM"/>
+      <param name="BLOSUM" value="62"/>
+      <param name="distance_method" value="--fastapair"/>
+      <param name="weighti" value="2.7"/>
+      <param name="iterations" value="1000"/>
+      <param name="outputFormat" value="--clustalout"/>
+      <output name="outputAlignment" ftype="clustal" file="mafft_custom_result.aln"/>
+    </test>
+  </tests>
+  <help>    <![CDATA[
+      **What it does**
+      MAFFT is a multiple sequence alignment program for unix-like operating systems.
+      It offers a range of multiple alignment methods, L-INS-i (accurate; for alignment of <∼200 sequences),
+      FFT-NS-2 (fast; for alignment of <∼30,000 sequences), etc.
+      From the MAFFT man page, an overview of the different predefined flavours of the tool.
+      **Accuracy-oriented methods:**
+      - L-INS-i (probably most accurate; recommended for <200 sequences; iterative refinement method incorporating local pairwise alignment information):
+      - mafft --localpair --maxiterate 1000 input [> output]
+      - G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information):
+      - mafft --globalpair --maxiterate 1000 input [> output]
+      - E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences):
+      - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps.
+      **Speed-oriented methods:**
+      - FFT-NS-i (iterative refinement method; two cycles only):
+      - mafft --retree 2 --maxiterate 2 input [> output]
+      - FFT-NS-i (iterative refinement method; max. 1000 iterations):
+      - mafft --retree 2 --maxiterate 1000 input [> output]
+      - FFT-NS-2 (fast; progressive method):
+      - mafft --retree 2 --maxiterate 0 input [> output]
+      - FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree):
+      - mafft --retree 1 --maxiterate 0 input [> output]
+      - NW-NS-i (iterative refinement method without FFT approximation; two cycles only):
+      - mafft --retree 2 --maxiterate 2 --nofft input [> output]
+      - NW-NS-2 (fast; progressive method without the FFT approximation):
+      - mafft --retree 2 --maxiterate 0 --nofft input [> output]
+      - NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm):
+      - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output]
+
+      **Options:**
+      --auto
+      Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
+      --adjustdirection
+      Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored.
+      --op
+      Gap opening penalty, default: 1.53
+      --ep
+      Offset (works like gap extension penalty), default: 0.0
+      --maxiterate
+      Maximum number of iterative refinement, default: 0
+      --clustalout
+      Output: clustal format, default: fasta
+      --thread
+      Number of threads (if unsure, --thread -1)
+      --retree number
+      Guide tree is built number times in the progressive stage.
+      Valid with 6mer distance.  Default: 2
+      ]]>
+    </help>
+  <expand macro="citations" />
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/add_seq.fa	Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,2 @@
+>     1== M63632   1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+MNGTEGDNFYVPFSNKTGLARSPYEYPQYYLAEPWKYSALAAYMFFLILVGFPVNFLTLF
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mafft_add_result.aln	Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,481 @@
+>     1== M63632   1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+---------------------------------------------------------
+>     2== U22180   1 rat opsin <rod>[J.Mol.Neurosci.5(3),207-209'94]
+----------------------------------------MNG----------------T
+E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+GDDE--ASATASKTE------TSQVAPA--------------------------------
+---------------------------------------------------------
+>     3== M92038   1 chicken green sensitive cone opsin <retina>[PNAS89,5932-5936'9
+----------------------------------------MNG----------------T
+E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+---------------------------------------------------------
+>     4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish
+----------------------------------------MNG----------------T
+E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
+>     5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish
+----------------------------------------MNG----------------T
+E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
+>     6== L11864   1 Carassius auratus blue cone opsin <retina>[Biochemistry32,208-
+----------------------------------------MKQ----------------V
+PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+---------------------------------------------------------
+>     7== M13299   1 human BCP <>[Science232(4747),193-202'86]
+----------------------------------------MRK----------------M
+S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
+AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
+TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
+---------------------------------------------------------
+>     8=opsin, greensensitive  human (fragment) S07060
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------DLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
+>     9== K03494   1 human GCP <>[Science232(4747),193-202'86]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+>    10== Z68193   1 human Red Opsin <>[]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+>    11== M92036   1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92]
+----------------------------------------MTEAWNVAVFAARRSRDD-D
+DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+---------------------------------------------------------
+>    12== M62903   1 chicken visual pigment <>[BBRC173,1212-1217'90]
+----------------------------------------MAA-WEAAFAARRRHEE--E
+DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+---------------------------------------------------------
+>    13== S75720   1 chicken P-opsin <>[Science267(5203),1502-1506'95]
+----------------------------------------MS-----------------S
+NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+---------------------------------------------------------
+>    14== M17718   1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87]
+----------MESGNVSS------------SLFGNVST-ALRP----------------E
+ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+---------------------------------------------------------
+>    15== X65879   1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92
+----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VDSL------------------------------------------------------
+----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
+>    16== M17730   1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87]
+----------ME------------------PL-CNASEPPLRP----------------E
+AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
+>    17== X65880   1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92
+----------MD------------------AL-CNASEPPLRP----------------E
+ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+---------------------------------------------------------
+>    18== D50584   1 Hemigrapsus sanguineus opsin BcRh2 <compound eye>[J.Exp.Biol.1
+--------------------------------MTNATGPQMAY----------------Y
+GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VSTL------------------------------------------------------
+----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+---------------------------------------------------------
+>    19== D50583   1 Hemigrapsus sanguineus opsin BcRh1 <compound eye>[J.Exp.Biol.1
+--------------------------------MANVTGPQMAF----------------Y
+GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VTNL------------------------------------------------------
+----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+DPND--VEENQSSNTQTQEK-S--------------------------------------
+---------------------------------------------------------
+>    20== K02320   1 D.melanogaster opsin <>[Cell40,851-858'85]
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
+>    21== K02315   1 D.melanogaster ninaE <>[Cell40,839-850'85]
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
+>    22== X65877   1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204'
+----------MD----SF------------AAVATQLGPQFAA----------------P
+S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+---------------------------------------------------------
+>    23== M12896   1 D.melanogaster Rh2 <>[Cell44,705-710'86]
+-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+---------------------------------------------------------
+>    24== X65878   1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92
+-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+---------------------------------------------------------
+>    25== U26026   1 Apis mellifera long-wavelength rhodopsin <>[]
+--------------------------------MIAVSGPSYEA----------------F
+SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+---------------------------------------------------------
+>    26== L03781   1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93]
+----------------------------------MANQLSYSS----------------L
+GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+---------------------------------------------------------
+>    27== X07797   1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88]
+---------------------------------------MVES----------------T
+TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
+>    28== X70498   1 Todarodes pacificus rhodopsin <retina>[FEBS317(1-2),5-11'93]
+----------------------------------------MGR----------------D
+LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
+>    29== L21195   1 human serotonin 5-HT7 receptor protein <placenta and fetal bra
+---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D
+PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----EPDSVIALNG-------
+--IVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERPEF------------VLQNADY-------------
+--------------------------------------------CRKKGHDS-----
+>    30== L15228   1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93]
+------------------------------------------------------------
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
+>    31=p A47425 serotonin receptor 5HT-7 - rat
+------------------------------------------------------------
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
+>    32== M83181   1 human serotonin receptor <>[JBC267(11),7553-7562'92]
+----------MDVLSP--------------------------------------------
+---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
+------------------------------------------------------------
+---------------------------------------------------------
+>    33=p A35181 serotonin receptor class 1A - rat
+----------MDVFSF--------------------------------------------
+---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
+------------------------------------------------------------
+---------------------------------------------------------
+>    34== L06803   1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93]
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+------------------------------------------------------------
+---------------------------------------------------------
+>    35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+------------------------------------------------------------
+---------------------------------------------------------
+>    36== X95604   1 Bombyx mori serotonin receptor <antennae>[InsectBiochem.Mol.Bi
+-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
+VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
+AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
+AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
+AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
+------A---------------PQ------------------------------------
+---------------------------------------------------------
+>     1== M63632   1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLF----------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mafft_custom_result.aln	Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,458 @@
+CLUSTAL format alignment by MAFFT F-INS-i (v7.455)
+
+
+1==             MN------------------------GTE--GDNFYVPFS--------NKTGL-ARSPYE
+2==             MN------------------------GTE--GPNFYVPFS--------NITGV-VRSPFE
+3==             MN------------------------GTE--GINFYVPMS--------NKTGV-VRSPFE
+4=p             MN------------------------GTE--GKNFYVPMS--------NRTGL-VRSPFE
+5=p             MN------------------------GTE--GNNFYVPLS--------NRTGL-VRSPFE
+6==             MK------------------------QVPEFHEDFYIPIP-------LDINNLSAYSPFL
+7==             MR------------------------KMS--EEEFYL------------FKNISSVGPWD
+8=opsin,        ------------------------------------------------------------
+9==             MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE
+10==            MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE
+11==            MTEAWNVAVFAARRSRDD------DDTTR--GSVFTYTNT--------NN----TRGPFE
+12==            MA-AWEAA-FAARRRHEE------EDTTR--DSVFTYTNS--------NN----TRGPFE
+13==            MS----------------------SNSSQ--------------AP--PNG----TPGPFD
+14==            MESG-NV-----------------------------------------SSSLFGNVSTAL
+15==            MEYH-NV------------------------------------------SSVLGNVSSVL
+16==            MEPLCNA------------------------------------------------SEPPL
+17==            MDALCNA------------------------------------------------SEPPL
+18==            MT-------------------------------------------------------NAT
+19==            MA-------------------------------------------------------NVT
+20==            ME-------------------------------------------------SFAVAAAQL
+21==            ME-------------------------------------------------SFAVAAAQL
+22==            MD-------------------------------------------------SFAAVATQL
+23==            MERS--------------------------------------------HLPETPFDLAHS
+24==            MERS--------------------------------------------LLPEPPLAMALL
+25==            MI-------------------------------------------------------AVS
+26==            M-----------------------------------------------------------
+27==            MVESTT------------------------------------------------------
+28==            MGRD--------------------------------------------------------
+29==            MM-----DVNSSGRPDLYGH-----------LRSFLLPEVGRGLPDLSPDGGADPVAGSW
+30==            M-----------------------------------------------------------
+31=p            M-----------------------------------------------------------
+32==            MD------VLSPGQ----------------------------------GNNTTSPPAPFE
+33=p            MD------VFSFGQ----------------------------------GNNTTASQEPFG
+34==            MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL
+35=p            MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL
+36==            ME-------GAEGQEELD-------------WEALYLRL---------PLQNCSWNSTGW
+                                                                            
+
+1==             YP----------------------------------------------------------
+2==             QP----------------------------------------------------------
+3==             YP----------------------------------------------------------
+4=p             YP----------------------------------------------------------
+5=p             YP----------------------------------------------------------
+6==             VP----------------------------------------------------------
+7==             GP----------------------------------------------------------
+8=opsin,        ------------------------------------------------------------
+9==             GP----------------------------------------------------------
+10==            GP----------------------------------------------------------
+11==            GP----------------------------------------------------------
+12==            GP----------------------------------------------------------
+13==            GP----------------------------------------------------------
+14==            RPEARL----------------------SAETRLLGWNVPPEELRHIPEHWL--------
+15==            RPDARL----------------------SAESRLLGWNVPPDELRHIPEHWL--------
+16==            RPEAR-SSG-------------------NGDLQFLGWNVPPDQIQYIPEHWL--------
+17==            RPEARMSSG-------------------SDELQFLGWNVPPDQIQYIPEHWL--------
+18==            GPQMAYYGAASMDFG-------------YPEGVSIVDFVRPEIKPYVHQHWY--------
+19==            GPQMAFYGSGAATFG-------------YPEGMTVADFVPDRVKHMVLDHWY--------
+20==            GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN--------
+21==            GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN--------
+22==            GPQFAAPS-----------------------NGSVVDKVTPDMAHLISPYWD--------
+23==            GPRFQAQSSG---------------------NGSVLDNVLPDMAHLVNPYWS--------
+24==            GPRFEAQTGG---------------------NRSVLDNVLPDMAPLVNPHWS--------
+25==            GPSYEAFSYG--GQA-------------RFNNQTVVDKVPPDMLHLIDANWY--------
+26==            -ANQLSYSSL--GWP-------------YQPNASVVDTMPKEMLYMIHEHWY--------
+27==            ----------LVNQT-------------WWYNPTV----------DIHPHWA--------
+28==            ---------LRDNET-------------WWYNPSI----------VVHPHWR--------
+29==            APHLLS-----------------------------------EVTASPAPTWDAPPDNASG
+30==            -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG
+31=p            -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG
+32==            TG--------------------------------------GNTTGI--------------
+33=p            TG--------------------------------------GNVTSI--------------
+34==            SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL-------
+35=p            SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL-------
+36==            EPNW-------------------------------------NVTVVPNTTWWQ-------
+                                                                            
+
+1==             -----QY-YLAEPWKYSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAM
+2==             -----QY-YLAEPWQFSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAV
+3==             -----QY-YLAEPWKYRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAV
+4=p             -----QY-YLAEPWQFKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAV
+5=p             -----QY-YLAEPWQFKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAV
+6==             -----QD-HLGNQGIFMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSI
+7==             -----QY-HIAPVWAFYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSF
+8=opsin,        ------------------------------------------------------------
+9==             -----NY-HIAPRWVYHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAV
+10==            -----NY-HIAPRWVYHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAV
+11==            -----NY-HIAPRWVYNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAF
+12==            -----NY-HIAPRWVYNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAV
+13==            -----QWPYQAPQSTYVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAV
+14==            -----TY-PEPPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAF
+15==            -----IY-PEPPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAF
+16==            -----TQ-LEPPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAV
+17==            -----TQ-LEPPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAV
+18==            -----NY-PPVNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLAL
+19==            -----NY-PPVNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLAL
+20==            -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+21==            -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+22==            -----QF-PAMDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+23==            -----RF-APMDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF
+24==            -----RF-APMDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF
+25==            -----QY-PPLNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAI
+26==            -----AF-PPMNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAF
+27==            -----KF-DPIPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAM
+28==            -----EF-DQVPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAF
+29==            CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLAL
+30==            CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL
+31=p            CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL
+32==            SDVTVSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV
+33=p            SDVTFSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV
+34==            TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV
+35=p            TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV
+36==            --ASAPFDTPAALVRAAAKAVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAV
+                                                                            
+
+1==             ANLFMVLFG-FTVTMYTSMNG-YFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYI
+2==             ADLFMVFGG-FTTTLYTSLHG-YFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYV
+3==             ADLFMACFG-FTVTFYTAWNG-YFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYI
+4=p             AGTIMVCFG-FTVTFYTAING-YFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI
+5=p             AGAIMVCFG-FTVTFYTAING-YFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI
+6==             ANLFVAIFG-SPLSFYSFFNR-YFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWL
+7==             GGFLLCIFS-VFPVFVASCNG-YFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYI
+8=opsin,        -DLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL
+9==             ADLAETVIA-STISVVNQVYG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWM
+10==            ADLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL
+11==            VDLVETLVA-STISVFNQIFG-YFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWF
+12==            ADLGETVIA-STISVINQISG-YFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWF
+13==            ADLLVTLCG-SSVSLSNNING-FFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYV
+14==            CDFMMMVK--TPIFIYNSFHQ-GYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFN
+15==            CDFMMMIK--TPIFIYNSFHQ-GYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYN
+16==            FDLIMCLK--APIF--NSFHR-GFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN
+17==            FDLIMCLK--APIFIYNSFHR-GFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN
+18==            SDLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYN
+19==            SDLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYN
+20==            SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+21==            SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+22==            SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+23==            SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYN
+24==            SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYN
+25==            SNFLMMFCM-SPPMVINCYYE-TWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYN
+26==            SDFCMMAFM-MPTMTSNCFAE-TWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYN
+27==            SDLSFSAINGFPLKTISAFMK-KWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYN
+28==            SDFTFSLVNGFPLMTISCFLK-KWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYN
+29==            ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+30==            ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+31=p            ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+32==            TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW
+33=p            TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW
+34==            ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW
+35=p            ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW
+36==            ADLLVACLV-MPLGAVYEVVQ-RWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYW
+                 .                     :   :    * :                  :  :*: 
+
+1==             VICKPMGNFR-FGNTHAIMGVAFTWIMALACA-APPLV-GWSRYIPEGMQCSCGPDYYTL
+2==             VVCKPMSNFR-FGENHAIMGVAFTWVMALACA-APPLV-GWSRYIPEGMQCSCGIDYYTL
+3==             VVCKPMGNFR-FSATHAMMGIAFTWVMAFSCA-APPLF-GWSRYMPEGMQCSCGPDYYTH
+4=p             VVCKPMGSFK-FSSSHAFAGIAFTWVMALACA-APPLF-GWSRYIPEGMQCSCGPDYYTL
+5=p             VVCKPMGSFK-FSSTHASAGIAFTWVMAMACA-APPLV-GWSRYIPEGIQCSCGPDYYTL
+6==             VICKPLGNFT-FKTPHAIAGCILPWISALAAS-LPPLF-GWSRYIPEGLQCSCGPDWYTT
+7==             VICKPFGNFR-FSSKHALTVVLATWTIGIGVS-IPPFF-GWSRFIPEGLQCSCGPDWYTV
+8=opsin,        VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+9==             VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+10==            VVCKPFGNVR-FDAKLAIVGIAFSWIWSAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+11==            VVCKPFGNIK-FDSKLAIIGIVFSWVWAWGWS-APPIF-GWSRYWPHGLKTSCGPDVFSG
+12==            VVCKPFGNIK-FDGKLAVAGILFSWLWSCAWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+13==            VVCKPLGDFQ-FQRRHAVSGCAFTWGWALLWS-APPLL-GWSSYVPEGLRTSCGPNWYTG
+14==            VITRPMEGK--MTHGKAIAMIIFIYMYATPWV-VACYTETWGRFVPEGYLTSCTFDYLTD
+15==            VITRPMEGK--MTHGKAIAMIIFIYLYATPWV-VACYTESWGRFVPEGYLTSCTFDYLTD
+16==            VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD
+17==            VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD
+18==            IICNGFNGPK-LTTGKAVVFALISWVIAIGCA-LPPFF-GWGNYILEGILDSCSYDYLTQ
+19==            IICNGFNGPK-LTQGKATFMCGLAWVISVGWS-LPPFF-GWGSYTLEGILDSCSYDYFTR
+20==            VIVKGMAGRP-MTIPLALGKM----------------------YVPEGNLTSCGIDYLER
+21==            VIVKGMAGRP-MTIPLALGKIAYIWFMSSIWC-LAPAF-GWSRYVPEGNLTSCGIDYLER
+22==            VIVKGMAGRP-MTIPLALGKIAYIWFMSTIWCCLAPVF-GWSRYVPEGNLTSCGIDYLER
+23==            VIVKGINGTP-MTIKTSIMKILFIWMMAVFWT-VMPLI-GWSAYVPEGNLTACSIDYMTR
+24==            VIVKGINGTP-MTIKTSIMKIAFIWMMAVFWT-IMPLI-GWSSYVPEGNLTACSIDYMTR
+25==            VIVKGLSGKP-LSINGALIRIIAIWLFSLGWT-IAPMF-GWNRYVPEGNMTACGTDYFNR
+26==            VIVRGMAAAP-LTHKKATLLLLFVWIWSGGWT-ILPFF-GWSRYVPEGNLTSCTVDYLTK
+27==            VIGRPMAASKKMSHRRAFLMIIFVWMWSIVWS-VGPVF-NWGAYVPEGILTSCSFDYLST
+28==            VIGRPMAASKKMSHRRAFIMIIFVWLWSVLWA-IGPIF-GWGAYTLEGVLCNCSFDYISR
+29==            GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+30==            GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+31=p            GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+32==            AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK
+33=p            AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK
+34==            AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ
+35=p            AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ
+36==            AVTN-IDYIHASTAKRVGMMIACVWTVSFFVC-IAQLL-GWKDPDWNQRVSEDLRCVVSQ
+                 :   :                                                      
+
+1==             NPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTVKEAAAAQQE---------------
+2==             KPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTVKEAAAQQQE---------------
+3==             NPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKVREAAAQQQE---------------
+4=p             NPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTVKAAAAQQQD---------------
+5=p             NPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTVKAAAAQQQD---------------
+6==             NNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITLKLAAKAQAD---------------
+7==             GTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRALKAVAAQQQE---------------
+8=opsin,        SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE---------------
+9==             SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE---------------
+10==            SSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAIRAVAKQQKE---------------
+11==            SVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAIRAVAAQQKE---------------
+12==            SSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAIRAVAAQQKE---------------
+13==            GS--NNNSYILSLFVTCFVLPLSLILFSYTNLLLTLRAAAAQQKE---------------
+14==            NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVESLRSNV-
+15==            NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVDSLRSNV-
+16==            NF--DTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKKMNVESLRSNV-
+17==            NF--DTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKKMNVESLRSNV-
+18==            DF--NTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKKMNVSTLRSN--
+19==            DM--NTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKKMNVTNLRSN--
+20==            DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+21==            DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+22==            DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+23==            MW--NPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKKMNVKSLRSS--
+24==            QW--NPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKKMNVKSLRSS--
+25==            GL--LSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKKMNVASLRSS--
+26==            DW--SSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKKMNVASLRANA-
+27==            DP--STRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA--
+28==            DS--TTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA--
+29==            D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+30==            D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+31=p            D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+32==            D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVKKVEKTGADTRHGASP
+33=p            D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVRKVEKKGAGTSLGTSS
+34==            D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV
+35=p            D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV
+36==            D-----VGYQIFATASSFYVPVLIILILYWRIYQTARKRIRRRRGA-------TARGGVG
+                                    *   :   *  :                            
+
+1==             ------------------------------------------------------------
+2==             ------------------------------------------------------------
+3==             ------------------------------------------------------------
+4=p             ------------------------------------------------------------
+5=p             ------------------------------------------------------------
+6==             ------------------------------------------------------------
+7==             ------------------------------------------------------------
+8=opsin,        ------------------------------------------------------------
+9==             ------------------------------------------------------------
+10==            ------------------------------------------------------------
+11==            ------------------------------------------------------------
+12==            ------------------------------------------------------------
+13==            ------------------------------------------------------------
+14==            ------------------------------------------------------------
+15==            ------------------------------------------------------------
+16==            ------------------------------------------------------------
+17==            ------------------------------------------------------------
+18==            ------------------------------------------------------------
+19==            ------------------------------------------------------------
+20==            ------------------------------------------------------------
+21==            ------------------------------------------------------------
+22==            ------------------------------------------------------------
+23==            ------------------------------------------------------------
+24==            ------------------------------------------------------------
+25==            ------------------------------------------------------------
+26==            ------------------------------------------------------------
+27==            ------------------------------------------------------------
+28==            ------------------------------------------------------------
+29==            GFPRVE--------------------------------PDSVI----------ALNGIVK
+30==            GFPRVQ--------------------------------PESVI----------SLNGVVK
+31=p            GFPRVQ--------------------------------PESVI----------SLNGVVK
+32==            A-PQPKKS-VNGESGSRNWRLGVESKAGGAL-----C-----------------ANGAVR
+33=p            A-PPPKKS-LNGQPGSGDWRRCAENRAVGTP-----C-----------------TNGAVR
+34==            ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV--
+35=p            ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV--
+36==            PPPVPAGGALVAGGGSGGIAAAVVAVIGR---------PLPTISET-------TTTGFTN
+                                                                            
+
+1==             ------------------------------------------------------------
+2==             ------------------------------------------------------------
+3==             ------------------------------------------------------------
+4=p             ------------------------------------------------------------
+5=p             ------------------------------------------------------------
+6==             ------------------------------------------------------------
+7==             ------------------------------------------------------------
+8=opsin,        ------------------------------------------------------------
+9==             ------------------------------------------------------------
+10==            ------------------------------------------------------------
+11==            ------------------------------------------------------------
+12==            ------------------------------------------------------------
+13==            ------------------------------------------------------------
+14==            ------------------------------------------------------------
+15==            ------------------------------------------------------------
+16==            ------------------------------------------------------------
+17==            ------------------------------------------------------------
+18==            ------------------------------------------------------------
+19==            ------------------------------------------------------------
+20==            ------------------------------------------------------------
+21==            ------------------------------------------------------------
+22==            ------------------------------------------------------------
+23==            ------------------------------------------------------------
+24==            ------------------------------------------------------------
+25==            ------------------------------------------------------------
+26==            ------------------------------------------------------------
+27==            ------------------------------------------------------------
+28==            ------------------------------------------------------------
+29==            -------------LQKEVEEC-AN------------------LSRLLKHER---------
+30==            -------------LQKEVEEC-AN------------------LSRLLKHER---------
+31=p            -------------LQKEVEEC-AN------------------LSRLLKHER---------
+32==            QGDDGAALEV-----IEVHRV-GNSKEHLPLPSEAGP--TPCAPASFERKNERN------
+33=p            QGDDEATLEV-----IEVHRV-GNSKEHLPLPSESGS--NSYAPACLERKNERN------
+34==            -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN
+35=p            -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN
+36==            VSSNNTSP--------EKQSC-ANGLEADPPTTGYGAVAAAYYPSLVRRKP---------
+                                                                            
+
+1==             --------SASTQKAEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT--HQGSDFGAT-FM
+2==             --------SATTQKAEKEVTRMVIIMVIFFLICWLPYASVAMYIFT--HQGSNFGPI-FM
+3==             --------SATTQKAEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT--NKGADFTAT-LM
+4=p             --------SASTQKAEREVTKMVILMVFGFLIAWTPYATVAAWIFF--NKGADFSAK-FM
+5=p             --------SASTQKAEREVTKMVILMVLGFLVAWTPYATVAAWIFF--NKGAAFSAQ-FM
+6==             --------SASTQKAEREVTKMVVVMVLGFLVCWAPYASFSLWIVS--HRGEEFDLR-MA
+7==             --------SATTQKAEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN--NRNHGLDLR-LV
+8=opsin,        --------SESTQKAEKEVTRMVVVMVLAFC-----------------------------
+9==             --------SESTQKAEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA--NPGYPFHPL-MA
+10==            --------SESTQKAEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA--NPGYAFHPL-MA
+11==            --------SESTQKAEREVSRMVVVMIVAFCICWGPYASFVSFAAA--NPGYAFHPL-AA
+12==            --------SESTQKAEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA--NPGYAFHPL-AA
+13==            --------ADTTQRAEREVTRMVIVMVMAFLLCWLPYSTFALVVAT--HKGIIIQPV-LA
+14==            --------DKNKETAEIRIAKAAITICFLFFCSWTPYGVMSLIGAF--GDKTLLTPG-AT
+15==            --------DKSKEAAEIRIAKAAITICFLFFASWTPYGVMSLIGAF--GDKTLLTPG-AT
+16==            --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTQG-AT
+17==            --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTPG-AT
+18==            --------EADAQRAEIRIAKTALVNVSLWFICWTPYALISLKGVM--GDTSGITPL-VS
+19==            --------EAETQRAEIRIAKTALVNVSLWFICWTPYAAITIQGLL--GNAEGITPL-LT
+20==            --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+21==            --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+22==            --------EDADKSAEGKLAKVALVTISLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+23==            --------EDCDKSAEGKLAKVALTTISLWFMAWTPYLVICYFGLF--KI-DGLTPL-TT
+24==            --------EDCDKSAENKLAKVALTTISLWFMAWTPYLIICYFGLF--KI-DGLTPL-TT
+25==            --------ENQNTSAECKLAKVALMTISLWFMAWTPYLVINFSGIF--NL-VKISPL-FT
+26==            --------DQQKQSAECRLAKVAMMTVGLWFMAWTPYLIISWAGVF--SSGTRLTPL-AT
+27==            --------Q-AGASAEMKLAKISMVIITQFMLSWSPYAIIALLAQF--GPAEWVTPY-AA
+28==            --------Q-AGANAEMRLAKISIVIVSQFLLSWSPYAVVALLAQF--GPLEWVTPY-AA
+29==            -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+30==            -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+31=p            -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+32==            ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPTL-LG
+33=p            ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPAL-LG
+34==            DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR
+35=p            DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR
+36==            -------KEAADSKRERKAAKTLAIITGAFVACWLPFFVLAILVPT-CD--CEVSPV-LT
+                               * .           :                              
+
+1==             TLPAFFAKSSALYNPVIYILMNKQFRNCMITTL-----CC-----GKNPLGDDE-SGA-S
+2==             TLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSL-----CC-----GKNPLGDDE-ASA-T
+3==             AVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTI-----CC-----GKNPFGDEDVSSTVS
+4=p             AIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTI-----FC-----GKNPLGDDE-SSTVS
+5=p             AIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTL-----FC-----GKNPLGDEE-SSTVS
+6==             TIPSCLSKASTVYNPVIYVLMNKQFRSCMMK-M-----VC-----GKN-IEEDE-AST-S
+7==             TIPSFFSKSACIYNPIIYCFMNKQFQACIMK-M-----VC-----GKA-MTDES-DTC-S
+8=opsin,        ------------------------------------------------------------
+9==             ALPAFFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S
+10==            ALPAYFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S
+11==            ALPAYFAKSATIYNPVIYVFMNRQFRNCIMQ-L-----F------GKK-VDDGS-EAS-T
+12==            ALPAYFAKSATIYNPIIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-EVS-T
+13==            SLPSYFSKTATVYNPIIYVFMNKQFQSCLLEML-----CC-----GYQPQRTGKASPGTP
+14==            MIPACACKMVACIDPFVYAISHPRYRMELQKRCPW---LALN---EK----APE-SSA-V
+15==            MIPACTCKMVACIDPFVYAISHPRYRMELQKRCPW---LAIS---EK----APE-SRA-A
+16==            MIPACTCKLVACIDPFVYAISHPRYRLELQKRCPW---LGVN---EK----SGE-ISS-A
+17==            MIPACTCKLVACIEPFVYAISHPRYRMELQKRCPW---LGVN---EK----SGE-ASS-A
+18==            TLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPW---FCVH---ET----ETK-SND-D
+19==            TLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPW---FCVH---EK----DPN-DVE-E
+20==            IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A
+21==            IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A
+22==            IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSE-A
+23==            IWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCP----MCVF---GNT--DEPK-PDA-P
+24==            IWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCP----MCVC---GTT--DEPK-PDA-P
+25==            IWGSLFAKANAVYNPIVYGISHPKYRAALFAKFP----SLAC---AA----EPS-SDA-V
+26==            IWGSVFAKANSCYNPIVYGISHPRYKAALYQRFP----SLAC---GS---GESG-SDV-K
+27==            ELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQF---DEK--ECED-AND-A
+28==            QLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQF---DDK--ETED-DKD-A
+29==            RTFLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM
+30==            RTCLWLGYANSLINPFIYAFFNRDLRPTSRSLL-----QCQYRNINRKL------SAAGM
+31=p            RTCLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM
+32==            AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRQ------------
+33=p            AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRR------------
+34==            SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------
+35=p            SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------
+36==            SLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLL------CGRRVRRRR------------
+                                                                            
+
+1==             TSKTEVSSVSTS------------------------------------------------
+2==             ASKTETSQVA--------------------------------------------------
+3==             QSKTEVSSVSSS------------------------------------------------
+4=p             TSKTEVSSVS--------------------------------------------------
+5=p             TSKTEVSSVS--------------------------------------------------
+6==             SQVTQVSSVA--------------------------------------------------
+7==             SQKTEVSTVSST------------------------------------------------
+8=opsin,        ------------------------------------------------------------
+9==             ASKTEVSSVS--------------------------------------------------
+10==            ASKTEVSSVS--------------------------------------------------
+11==            TSRTEVSSVSNS------------------------------------------------
+12==            -SRTEVSSVSNS------------------------------------------------
+13==            GPHADVTAAGLR------------------------------------------------
+14==            ASTS-TTQEPQ-------------------------------------------------
+15==            ISTS-TTQEQQ-------------------------------------------------
+16==            QSTT-TQEQ-Q-------------------------------------------------
+17==            QSTT-TQEQTQ-------------------------------------------------
+18==            SQSNSTVAQDK-------------------------------------------------
+19==            NQSSNTQTQEK-------------------------------------------------
+20==            QSQA-TASEAE-------------------------------------------------
+21==            QSQA-TASEAE-------------------------------------------------
+22==            QSQA-TTSEAE-------------------------------------------------
+23==            ASDTETTSEAD-------------------------------------------------
+24==            PSDTETTSEAE-------------------------------------------------
+25==            STTSGTTTVTDN------------------------------------------------
+26==            SEASATTTMEEK------------------------------------------------
+27==            EEEV-VASERG--GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PPQGYPPQGA
+28==            ETEI-PAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPPQGYPPQG-
+29==            HEALKLAERPERP-----------------EFVLQNA-----------------------
+30==            HEALKLAERPERS-----------------EFVLQNS-----------------------
+31=p            HEALKLAERPERS-----------------EFVLQNS-----------------------
+32==            ------------------------------------------------------------
+33=p            ------------------------------------------------------------
+34==            ------------------------------------------------------------
+35=p            ------------------------------------------------------------
+36==            ------------------------------------------------------------
+                                                                            
+
+1==             --------------------------------------------PVSP-A---
+2==             -----------------------------------------------P-A---
+3==             --------------------------------------------QVSP-A---
+4=p             -----------------------------------------------P-A---
+5=p             -----------------------------------------------P-A---
+6==             -----------------------------------------------PEK---
+7==             --------------------------------------------QVGP-N---
+8=opsin,        -----------------------------------------------------
+9==             --------------------------------------------SVSP-A---
+10==            --------------------------------------------SVSP-A---
+11==            --------------------------------------------SVAP-A---
+12==            --------------------------------------------SVSP-A---
+13==            -------------------------------------------NKVMP-AHPV
+14==            --------------------------------------------QTTA-A---
+15==            --------------------------------------------QTTA-A---
+16==            --------------------------------------------QTTA-A---
+17==            --------------------------------------------QTSA-A---
+18==            -------------------------------------------------A---
+19==            -------------------------------------------------S---
+20==            ----------------------------------------------SK-A---
+21==            ----------------------------------------------SK-A---
+22==            ----------------------------------------------SK-A---
+23==            ----------------------------------------------SK-A---
+24==            ----------------------------------------------SK-D---
+25==            -------------------------------------------EK-SN-A---
+26==            -------------------------------------------PKIPE-A---
+27==            YPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQ-A---
+28==            YPP-QGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQ-A---
+29==            -------------------------------------------DYCRKKGHDS
+30==            -------------------------------------------DHCGKKGHDT
+31=p            -------------------------------------------DHCGKKGHDT
+32==            -----------------------------------------------------
+33=p            -----------------------------------------------------
+34==            -----------------------------------------------------
+35=p            -----------------------------------------------------
+36==            -------------------------------------------------A-PQ
+                                                                     
--- a/test-data/mafft_fftns_result.aln	Sat Nov 11 15:06:34 2017 -0500
+++ b/test-data/mafft_fftns_result.aln	Wed Apr 15 15:33:37 2020 -0400
@@ -1,504 +1,468 @@
 >     1== M63632   1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
---------------------------------MNGTE--------------GDNF-----
--------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK---
---------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA
-NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV
-ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD
-YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE--------------
-------------------------------------------------------AAAAQQ
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
 ------------------------------------------------------------
---------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA
-FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------
---GKNPLGDDE--SGASTSKTEVSSVS-TSPVS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+---------------------------------------------------------
 >     2== U22180   1 rat opsin <rod>[J.Mol.Neurosci.5(3),207-209'94]
---------------------------------MNGTE--------------GPNF-----
--------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ---
---------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA
-DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV
-VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID
-YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
 ------------------------------------------------------------
---------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA
-MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------
---GKNPLGDDE--ASATASKTE------TSQVA---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+GDDE--ASATASKTE------TSQVAPA--------------------------------
+---------------------------------------------------------
 >     3== M92038   1 chicken green sensitive cone opsin <retina>[PNAS89,5932-5936'9
---------------------------------MNGTE--------------GINF-----
--------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK---
---------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA
-DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV
-VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD
-YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
 ------------------------------------------------------------
---------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA
-FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------
---GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+---------------------------------------------------------
 >     4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish
---------------------------------MNGTE--------------GKNF-----
--------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
---------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA
-GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD
-YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
 ------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA
-AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------
---GKNPLGDDE-SSTVSTSKTEVSS------VS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
 >     5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish
---------------------------------MNGTE--------------GNNF-----
--------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
---------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA
-GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD
-YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
 ------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA
-AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------
---GKNPLGDEE-SSTVSTSKTEVSS------VS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
 >     6== L11864   1 Carassius auratus blue cone opsin <retina>[Biochemistry32,208-
---------------------------------MKQVPEF------------HEDF-----
--------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI---
---------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA
-NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV
-ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD
-WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL--------------
-------------------------------------------------------AAKAQA
+----------------------------------------MKQ----------------V
+PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
 ------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS
-LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------
---GKN-IEEDE--ASTSSQVTQVSS------VA---------------------------
------------------------------------PEK----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+---------------------------------------------------------
 >     7== M13299   1 human BCP <>[Science232(4747),193-202'86]
---------------------------------MRKMS--------------EEEF-----
--------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA---
---------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG
-GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV
-ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD
-WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA--------------
-------------------------------------------------------VAAQQQ
+----------------------------------------MRK----------------M
+S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
+AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
 ------------------------------------------------------------
---------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA
-MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------
---GKA-MTDES--DTCSSQKTEVSTVS-STQVG---------------------------
------------------------------------PN-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
+TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
+---------------------------------------------------------
 >     8=opsin, greensensitive  human (fragment) S07060
 ------------------------------------------------------------
 ------------------------------------------------------------
+------------------------------------------DLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
 ------------------------------------------------------------
-DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
+>     9== K03494   1 human GCP <>[Science232(4747),193-202'86]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+>    10== Z68193   1 human Red Opsin <>[]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
 ------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMVLAFC----------
+-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+>    11== M92036   1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92]
+----------------------------------------MTEAWNVAVFAARRSRDD-D
+DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+------------------------------------------------------------
 ------------------------------------------------------------
+-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+---------------------------------------------------------
+>    12== M62903   1 chicken visual pigment <>[BBRC173,1212-1217'90]
+----------------------------------------MAA-WEAAFAARRRHEE--E
+DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+---------------------------------------------------------
+>    13== S75720   1 chicken P-opsin <>[Science267(5203),1502-1506'95]
+----------------------------------------MS-----------------S
+NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
 ------------------------------------------------------------
 ------------------------------------------------------------
---
->     9== K03494   1 human GCP <>[Science232(4747),193-202'86]
---------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
--------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
---------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV
-VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA
-CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
------------------------------------PA-----------------------
---
->    10== Z68193   1 human Red Opsin <>[]
---------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
--------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
---------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA
-CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
------------------------------------PA-----------------------
---
->    11== M92036   1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92]
---------------------------------MTEAWNVAVFAARRSRDD-DDTT-----
--------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV---
---------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV
-DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV
-VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA--------------
-------------------------------------------------------VAAQQK
-------------------------------------------------------------
---------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV
-SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF-------
---GKK-VDDGS--EASTTSRTEVSSVS-NSSVA---------------------------
------------------------------------PA-----------------------
---
->    12== M62903   1 chicken visual pigment <>[BBRC173,1212-1217'90]
---------------------------------MAA-WEAAFAARRRHEE--EDTT-----
--------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV---
---------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA
-DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV
-VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA--------------
-------------------------------------------------------VAAQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA
-CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--EVST-SRTEVSSVS-NSSVS---------------------------
------------------------------------PA-----------------------
---
->    13== S75720   1 chicken P-opsin <>[Science267(5203),1502-1506'95]
---------------------------------MS-----------------SNSS-----
--------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST---
---------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA
-DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV
-VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN
-WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA--------------
-------------------------------------------------------AAAQQK
-------------------------------------------------------------
---------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA
-LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY---
--QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM---------------------------
------------------------------------PAHPV--------------------
---
+-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+---------------------------------------------------------
 >    14== M17718   1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87]
-----------MES--GNV-----------SSSLFGNVSTAL----------RPEA-----
--------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP
-E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC
-DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV
-ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD
-YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LRDQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS
-LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---
----NE-KAPES----SAVASTSTTQEPQQTTAA---------------------------
-------------------------------------------------------------
---
+----------MESGNVSS------------SLFGNVST-ALRP----------------E
+ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+---------------------------------------------------------
 >    15== X65879   1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92
-----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA-----
--------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP
-E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC
-DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV
-ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD
-YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LRDQAK
-KMN---------------VDSLRS------------------------------------
--------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS
-LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---
----SE-KAPES----RAAISTSTTQEQQQTTAA---------------------------
-------------------------------------------------------------
---
+----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VDSL------------------------------------------------------
+----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
 >    16== M17730   1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87]
-----------ME-------------------PLCNASEPPL----------RPEA-----
--------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL
-E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LREQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---
----NE-KSGEI----SSAQSTTTQEQ-QQTTAA---------------------------
-------------------------------------------------------------
---
+----------ME------------------PL-CNASEPPLRP----------------E
+AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
 >    17== X65880   1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92
-----------MD-------------------ALCNASEPPL----------RPEA-----
--------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL
-E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA--------------
-------------------------------------------------------LREQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---
----NE-KSGEA----SSAQSTTTQEQTQQTSAA---------------------------
-------------------------------------------------------------
---
+----------MD------------------AL-CNASEPPLRP----------------E
+ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+---------------------------------------------------------
 >    18== D50584   1 Hemigrapsus sanguineus opsin BcRh2 <compound eye>[J.Exp.Biol.1
---------------------------------MTNATGPQM----------AYYG-----
--------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP
-P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS
-DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI
-ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD
-YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA--------------
-------------------------------------------------------MRAQAK
-KMN---------------VSTLRS------------------------------------
---------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS
-LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV---
----HE-TETKS-NDDSQSNSTVAQDKA---------------------------------
-------------------------------------------------------------
---
+--------------------------------MTNATGPQMAY----------------Y
+GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VSTL------------------------------------------------------
+----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+---------------------------------------------------------
 >    19== D50583   1 Hemigrapsus sanguineus opsin BcRh1 <compound eye>[J.Exp.Biol.1
---------------------------------MANVTGPQM----------AFYG-----
--------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP
-P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS
-DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI
-ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD
-YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA--------------
-------------------------------------------------------MRAQAK
-KMN---------------VTNLRS------------------------------------
---------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT
-IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV---
----HE-KDPND-VEENQSSNTQTQEKS---------------------------------
-------------------------------------------------------------
---
+--------------------------------MANVTGPQMAF----------------Y
+GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VTNL------------------------------------------------------
+----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+DPND--VEENQSSNTQTQEK-S--------------------------------------
+---------------------------------------------------------
 >    20== K02320   1 D.melanogaster opsin <>[Cell40,851-858'85]
----------------MES-----------FAVAAAQLGPHF----------APLS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-------------------------------------------------------------
---
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
 >    21== K02315   1 D.melanogaster ninaE <>[Cell40,839-850'85]
----------------MES-----------FAVAAAQLGPHF----------APLS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-------------------------------------------------------------
---
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
 >    22== X65877   1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204'
----------------MDS-----------FAAVATQLGPQF----------AAPS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP
-A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSEAQSQATTSEAESKA-------------------------------
-------------------------------------------------------------
---
+----------MD----SF------------AAVATQLGPQFAA----------------P
+S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+---------------------------------------------------------
 >    23== M12896   1 D.melanogaster Rh2 <>[Cell44,705-710'86]
-----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS-----
--------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA
-P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV
-IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID
-YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC
-YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF---
----GN-TDEPKPDAPASDTETTSEADSKA-------------------------------
-------------------------------------------------------------
---
+-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+---------------------------------------------------------
 >    24== X65878   1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92
-----------MERSLLPE-----------PPLAMALLGPRF----------EAQT-----
--------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA
-P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV
-IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID
-YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA--------------
-------------------------------------------------------MRDQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC
-YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC---
----GT-TDEPKPDAPPSDTETTSEAESKD-------------------------------
-------------------------------------------------------------
---
+-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+---------------------------------------------------------
 >    25== U26026   1 Apis mellifera long-wavelength rhodopsin <>[]
---------------------------------MIAVSGPSY----------EAFS-----
--------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP
-P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS
-NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV
-IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD
-YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN--------------
-------------------------------------------------------MREQAK
-KMN---------------VASLRS------------------------------------
---------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN
-FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC---
-----A-AEPSS-DAVSTTSGTTTVTDNEKSNA----------------------------
-------------------------------------------------------------
---
+--------------------------------MIAVSGPSYEA----------------F
+SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+---------------------------------------------------------
 >    26== L03781   1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93]
-----------------------------------MANQLSY----------SSLG-----
--------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP
-P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS
-DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV
-IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD
-YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ--------------
-------------------------------------------------------LREQAK
-KMN---------------VASLRA------------------------------------
--------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS
-WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC---
----GS-GESGS-DVKSEASATTTMEEKPKIPEA---------------------------
-------------------------------------------------------------
---
+----------------------------------MANQLSYSS----------------L
+GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+---------------------------------------------------------
 >    27== X07797   1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88]
----------------------------------------MV----------ESTT-----
--------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD
-P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS
-DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV
-IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD
-YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE--------------
-------------------------------------------------------MAAMAK
-RLN---------------AKELR-------------------------------------
---------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA
-LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ
-FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG
-Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY
-QA
+---------------------------------------MVES----------------T
+TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
 >    28== X70498   1 Todarodes pacificus rhodopsin <retina>[FEBS317(1-2),5-11'93]
-----------------------------------------M----------GRDL-----
--------------RDNET-WWY--NPSI----------V------------VHPHWREFD
-Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS
-DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV
-IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD
-YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE--------------
-------------------------------------------------------MAAMAK
-RLN---------------AKELR-------------------------------------
---------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA
-LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ
-FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG
-YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY
-QA
+----------------------------------------MGR----------------D
+LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
 >    29== L21195   1 human serotonin 5-HT7 receptor protein <placenta and fetal bra
----------MMDVNSSGRPDLYGHLRSF-LLPEVGRGLPDL----------SPDGGADPV
-AGSWAPHLLS---EVTAS-----PAPTW------------DAPPDNAS--GCGEQIN---
----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALA
-DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
---------------------------------------------P----GFPRVEPDSVI
-ALNG--------------IVKLQ----------------------KEVEECANLSR----
---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-TARPFICGTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
----QY-RNINR--KLSAAGMHEALKLAER-------------------------------
------------------------------------PERPEFVL-QNADYCRKKGHDS---
---
+---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D
+PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----EPDSVIALNG-------
+--IVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERPEF------------VLQNADY-------------
+--------------------------------------------CRKKGHDS-----
 >    30== L15228   1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93]
 ------------------------------------------------------------
-----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
---------------------------------------------P----GFPRVQPESVI
-SLNG--------------VVKLQ----------------------KEVEECANLSR----
---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------
----QY-RNINR--KLSAAGMHEALKLAER-------------------------------
------------------------------------PERSEFVL-QNSDHCGKKGHDT---
---
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
 >    31=p A47425 serotonin receptor 5HT-7 - rat
 ------------------------------------------------------------
-----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
---------------------------------------------P----GFPRVQPESVI
-SLNG--------------VVKLQ----------------------KEVEECANLSR----
---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
----QY-RNINR--KLSAAGMHEALKLAER-------------------------------
------------------------------------PERSEFVL-QNSDHCGKKGHDT---
---
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
 >    32== M83181   1 human serotonin receptor <>[JBC267(11),7553-7562'92]
-----------MDVLSPG------------QGNNTTSPPAPF----------ETGG-----
--------------NTTGI-----SDVTV--------------------------------
-------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
--------------------------TVKKVEKTGADTRHGASPAP---------QPKKS-
--VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL
-PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
----KF-CRQ---------------------------------------------------
+----------MDVLSP--------------------------------------------
+---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
 ------------------------------------------------------------
---
+---------------------------------------------------------
 >    33=p A35181 serotonin receptor class 1A - rat
-----------MDVFSFG------------QGNNTTASQEPF----------GTGG-----
--------------NVTSI-----SDVTF--------------------------------
-------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
--------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS-
--LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL
-PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
----KF-CRR---------------------------------------------------
+----------MDVFSF--------------------------------------------
+---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
 ------------------------------------------------------------
---
+---------------------------------------------------------
 >    34== L06803   1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93]
-MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
--------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
----KY-RRGHR-------------------------------------------------
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
 ------------------------------------------------------------
---
+---------------------------------------------------------
 >    35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail
-MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
--------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
----KY-RRGHR-------------------------------------------------
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
 ------------------------------------------------------------
---
+---------------------------------------------------------
 >    36== X95604   1 Bombyx mori serotonin receptor <antennae>[InsectBiochem.Mol.Bi
--MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW-----
--------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK--
-------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA
-DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA
-VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD
-V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR---------------
-------------------------------RRRGATARGGVGPPP---------VPAGGA
-LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP
-TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA
-ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------
----RR-VRRRR--A----------------------------------------------
------------------------------------PQ-----------------------
---
+-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
+VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
+AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
+AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
+AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
+------A---------------PQ------------------------------------
+---------------------------------------------------------
--- a/test-data/mafft_nwns_result.aln	Sat Nov 11 15:06:34 2017 -0500
+++ b/test-data/mafft_nwns_result.aln	Wed Apr 15 15:33:37 2020 -0400
@@ -1,270 +1,270 @@
-CLUSTAL format alignment by MAFFT NW-NS-2 (v7.221)
+CLUSTAL format alignment by MAFFT NW-NS-2 (v7.455)
 
 
-1==             --------------------------------MNGTE--------------GDNF-----
-2==             --------------------------------MNGTE--------------GPNF-----
-3==             --------------------------------MNGTE--------------GINF-----
-4=p             --------------------------------MNGTE--------------GKNF-----
-5=p             --------------------------------MNGTE--------------GNNF-----
-6==             --------------------------------MKQVPEF------------HEDF-----
-7==             --------------------------------MRKMS--------------EEEF-----
+1==             ----------------------------------------MNG----------------T
+2==             ----------------------------------------MNG----------------T
+3==             ----------------------------------------MNG----------------T
+4=p             ----------------------------------------MNG----------------T
+5=p             ----------------------------------------MNG----------------T
+6==             ----------------------------------------MKQ----------------V
+7==             ----------------------------------------MRK----------------M
 8=opsin,        ------------------------------------------------------------
-9==             --------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
-10==            --------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
-11==            --------------------------------MTEAWNVAVFAARRSRDD-DDTT-----
-12==            --------------------------------MAA-WEAAFAARRRHEE--EDTT-----
-13==            --------------------------------MS-----------------SNSS-----
-14==            ----------MES--GNV-----------SSSLFGNVSTAL----------RPEA-----
-15==            ----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA-----
-16==            ----------ME-------------------PLCNASEPPL----------RPEA-----
-17==            ----------MD-------------------ALCNASEPPL----------RPEA-----
-18==            --------------------------------MTNATGPQM----------AYYG-----
-19==            --------------------------------MANVTGPQM----------AFYG-----
-20==            ---------------MES-----------FAVAAAQLGPHF----------APLS-----
-21==            ---------------MES-----------FAVAAAQLGPHF----------APLS-----
-22==            ---------------MDS-----------FAAVATQLGPQF----------AAPS-----
-23==            ----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS-----
-24==            ----------MERSLLPE-----------PPLAMALLGPRF----------EAQT-----
-25==            --------------------------------MIAVSGPSY----------EAFS-----
-26==            ----------------------------------MANQLSY----------SSLG-----
-27==            ---------------------------------------MV----------ESTT-----
-28==            ----------------------------------------M----------GRDL-----
-29==            ---------MMDVNSSGRPDLYGHLRSF-LLPEVGRGLPDL----------SPDGGADPV
+9==             ----------------------------------------MAQQWSLQRLAGRHPQDSYE
+10==            ----------------------------------------MAQQWSLQRLAGRHPQDSYE
+11==            ----------------------------------------MTEAWNVAVFAARRSRDD-D
+12==            ----------------------------------------MAA-WEAAFAARRRHEE--E
+13==            ----------------------------------------MS-----------------S
+14==            ----------MESGNVSS------------SLFGNVST-ALRP----------------E
+15==            ----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+16==            ----------ME------------------PL-CNASEPPLRP----------------E
+17==            ----------MD------------------AL-CNASEPPLRP----------------E
+18==            --------------------------------MTNATGPQMAY----------------Y
+19==            --------------------------------MANVTGPQMAF----------------Y
+20==            ----------ME----SF------------AVAAAQLGPHFAP----------------L
+21==            ----------ME----SF------------AVAAAQLGPHFAP----------------L
+22==            ----------MD----SF------------AAVATQLGPQFAA----------------P
+23==            -----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+24==            -----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+25==            --------------------------------MIAVSGPSYEA----------------F
+26==            ----------------------------------MANQLSYSS----------------L
+27==            ---------------------------------------MVES----------------T
+28==            ----------------------------------------MGR----------------D
+29==            ---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D
 30==            ------------------------------------------------------------
 31=p            ------------------------------------------------------------
-32==            ----------MDVLSPG------------QGNNTTSPPAPF----------ETGG-----
-33=p            ----------MDVFSFG------------QGNNTTASQEPF----------GTGG-----
-34==            MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
-35=p            MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
-36==            -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW-----
+32==            ----------MDVLSP--------------------------------------------
+33=p            ----------MDVFSF--------------------------------------------
+34==            MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+35=p            MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+36==            -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
                                                                             
 
-1==             -------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK---
-2==             -------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ---
-3==             -------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK---
-4=p             -------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
-5=p             -------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
-6==             -------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI---
-7==             -------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA---
+1==             E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+2==             E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+3==             E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+4=p             E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+5=p             E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+6==             PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+7==             S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
 8=opsin,        ------------------------------------------------------------
-9==             -------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
-10==            -------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
-11==            -------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV---
-12==            -------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV---
-13==            -------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST---
-14==            -------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP
-15==            -------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP
-16==            -------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL
-17==            -------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL
-18==            -------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP
-19==            -------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP
-20==            ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-21==            ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-22==            ------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP
-23==            -------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA
-24==            -------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA
-25==            -------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP
-26==            -------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP
-27==            -------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD
-28==            -------------RDNET-WWY--NPSI----------V------------VHPHWREFD
-29==            AGSWAPHLLS---EVTAS-----PAPTW------------DAPPDNAS--GCGEQIN---
-30==            ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
-31=p            ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
-32==            -------------NTTGI-----SDVTV--------------------------------
-33=p            -------------NVTSI-----SDVTF--------------------------------
-34==            -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-35=p            -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-36==            -------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK--
-                                                                            
-
-1==             --------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA
-2==             --------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA
-3==             --------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA
-4=p             --------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA
-5=p             --------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA
-6==             --------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA
-7==             --------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG
-8=opsin,        ------------------------------------------------------------
-9==             --------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-10==            --------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-11==            --------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV
-12==            --------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA
-13==            --------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA
-14==            E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC
-15==            E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC
-16==            E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-17==            E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-18==            P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS
-19==            P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS
-20==            A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-21==            A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-22==            A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-23==            P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-24==            P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-25==            P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS
-26==            P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS
-27==            P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS
-28==            Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS
-29==            ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALA
-30==            ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-31=p            ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-32==            ------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-33=p            ------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-34==            DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-35=p            DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-36==            ------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA
+9==             DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+10==            DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+11==            DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+12==            DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+13==            NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+14==            ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+15==            ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+16==            AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+17==            ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+18==            GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+19==            GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+20==            S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+21==            S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+22==            S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+23==            SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+24==            TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+25==            SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+26==            GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+27==            TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+28==            LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+29==            PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI
+30==            ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+31=p            ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+32==            ---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+33=p            ---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+34==            SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+35=p            SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+36==            VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
                                                                             
 
-1==             NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV
-2==             DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV
-3==             DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV
-4=p             GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-5=p             GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-6==             NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV
-7==             GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV
-8=opsin,        DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-9==             DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV
-10==            DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-11==            DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV
-12==            DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV
-13==            DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV
-14==            DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV
-15==            DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV
-16==            DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-17==            DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-18==            DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI
-19==            DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI
-20==            DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-21==            DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-22==            DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-23==            DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV
-24==            DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV
-25==            NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV
-26==            DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV
-27==            DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV
-28==            DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV
-29==            DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-30==            DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-31=p            DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-32==            DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-33=p            DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-34==            DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-35=p            DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-36==            DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA
-                .                     :   :    * :                  :  :*:  
+1==             AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+2==             AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+3==             CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+4=p             ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+5=p             AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+6==             SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+7==             AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+8=opsin,        ------------------------------------------DLAETVIA-STISIVNQV
+9==             SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+10==            SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+11==            SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+12==            SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+13==            AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+14==            GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+15==            GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+16==            GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+17==            GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+18==            GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+19==            GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+20==            TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+21==            TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+22==            TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+23==            GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+24==            GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+25==            GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+26==            GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+27==            GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+28==            GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+29==            GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+30==            GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+31=p            GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+32==            SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+33=p            SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+34==            SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+35=p            SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+36==            AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+                                                          .                 
+
+1==             N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+2==             H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+3==             N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+4=p             N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+5=p             N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+6==             N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+7==             N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+8=opsin,        S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+9==             Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+10==            S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+11==            F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+12==            S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+13==            N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+14==            H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+15==            H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+16==            H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+17==            H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+18==            SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+19==            SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+20==            F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+21==            F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+22==            F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+23==            Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+24==            Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+25==            Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+26==            A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+27==            M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+28==            L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+29==            IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+30==            IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+31=p            IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+32==            L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+33=p            L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+34==            S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+35=p            S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+36==            V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+                    :   :    * :                  :  :*:  :   :             
 
-1==             ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD
-2==             VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID
-3==             VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD
-4=p             VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD
-5=p             VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD
-6==             ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD
-7==             ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD
-8=opsin,        VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-9==             VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-10==            VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-11==            VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD
-12==            VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-13==            VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN
-14==            ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD
-15==            ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD
-16==            ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-17==            ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-18==            ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD
-19==            ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD
-20==            IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID
-21==            IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID
-22==            IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID
-23==            IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID
-24==            IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID
-25==            IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD
-26==            IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD
-27==            IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD
-28==            IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD
-29==            ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-30==            ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-31=p            ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-32==            ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-33=p            ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-34==            VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-35=p            VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-36==            VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD
-                :   :                                                      :
+1==             GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+2==             GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+3==             GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+4=p             GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+5=p             GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+6==             GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+7==             VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+8=opsin,        GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+9==             GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+10==            GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+11==            GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+12==            GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+13==            GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+14==            MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+15==            MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+16==            MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+17==            MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+18==            FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+19==            MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+20==            KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+21==            KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+22==            KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+23==            KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+24==            KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+25==            RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+26==            LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+27==            MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+28==            MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+29==            MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+30==            MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+31=p            MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+32==            LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+33=p            LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+34==            MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+35=p            MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+36==            MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+                                                         :                  
 
-1==             YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE--------------
-2==             YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE--------------
-3==             YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE--------------
-4=p             YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA--------------
-5=p             YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA--------------
-6==             WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL--------------
-7==             WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA--------------
-8=opsin,        VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-9==             VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-10==            VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA--------------
-11==            VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA--------------
-12==            VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA--------------
-13==            WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA--------------
-14==            YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-15==            YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-16==            YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA--------------
-17==            YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA--------------
-18==            YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA--------------
-19==            YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA--------------
-20==            YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-21==            YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-22==            YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-23==            YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA--------------
-24==            YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA--------------
-25==            YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN--------------
-26==            YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ--------------
-27==            YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE--------------
-28==            YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE--------------
-29==            F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-30==            F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-31=p            F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-32==            H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
-33=p            H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
-34==            K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-35=p            K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-36==            V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR---------------
-                                        *   :   *  :                        
+1==             VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
+2==             VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
+3==             VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
+4=p             VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
+5=p             ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
+6==             CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
+7==             IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
+8=opsin,        VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+9==             VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+10==            VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+11==            ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+12==            VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+13==            VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
+14==            FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+15==            FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+16==            FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+17==            LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+18==            VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+19==            IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+20==            IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+21==            IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+22==            IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+23==            LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+24==            LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+25==            IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+26==            LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+27==            FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+28==            ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+29==            AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+30==            AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+31=p            AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+32==            FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+33=p            FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+34==            VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+35=p            VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+36==            ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+                      *   :   *  :                                          
 
-1==             ------------------------------------------------------AAAAQQ
-2==             ------------------------------------------------------AAAQQQ
-3==             ------------------------------------------------------AAAQQQ
-4=p             ------------------------------------------------------AAAQQQ
-5=p             ------------------------------------------------------AAAQQQ
-6==             ------------------------------------------------------AAKAQA
-7==             ------------------------------------------------------VAAQQQ
-8=opsin,        ------------------------------------------------------VAKQQK
-9==             ------------------------------------------------------VAKQQK
-10==            ------------------------------------------------------VAKQQK
-11==            ------------------------------------------------------VAAQQK
-12==            ------------------------------------------------------VAAQQK
-13==            ------------------------------------------------------AAAQQK
-14==            ------------------------------------------------------LRDQAK
-15==            ------------------------------------------------------LRDQAK
-16==            ------------------------------------------------------LREQAK
-17==            ------------------------------------------------------LREQAK
-18==            ------------------------------------------------------MRAQAK
-19==            ------------------------------------------------------MRAQAK
-20==            ------------------------------------------------------MREQAK
-21==            ------------------------------------------------------MREQAK
-22==            ------------------------------------------------------MREQAK
-23==            ------------------------------------------------------MREQAK
-24==            ------------------------------------------------------MRDQAK
-25==            ------------------------------------------------------MREQAK
-26==            ------------------------------------------------------LREQAK
-27==            ------------------------------------------------------MAAMAK
-28==            ------------------------------------------------------MAAMAK
-29==            --------------------------------------------P----GFPRVEPDSVI
-30==            --------------------------------------------P----GFPRVQPESVI
-31=p            --------------------------------------------P----GFPRVQPESVI
-32==            -------------------------TVKKVEKTGADTRHGASPAP---------QPKKS-
-33=p            -------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS-
-34==            TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-35=p            TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-36==            ------------------------------RRRGATARGGVGPPP---------VPAGGA
+1==             ------------------------------------------------------------
+2==             ------------------------------------------------------------
+3==             ------------------------------------------------------------
+4=p             ------------------------------------------------------------
+5=p             ------------------------------------------------------------
+6==             ------------------------------------------------------------
+7==             ------------------------------------------------------------
+8=opsin,        ------------------------------------------------------------
+9==             ------------------------------------------------------------
+10==            ------------------------------------------------------------
+11==            ------------------------------------------------------------
+12==            ------------------------------------------------------------
+13==            ------------------------------------------------------------
+14==            --------------------------------------------------MN--------
+15==            --------------------------------------------------MN--------
+16==            --------------------------------------------------MN--------
+17==            --------------------------------------------------MN--------
+18==            --------------------------------------------------MN--------
+19==            --------------------------------------------------MN--------
+20==            --------------------------------------------------MN--------
+21==            --------------------------------------------------MN--------
+22==            --------------------------------------------------MN--------
+23==            --------------------------------------------------MN--------
+24==            --------------------------------------------------MN--------
+25==            --------------------------------------------------MN--------
+26==            --------------------------------------------------MN--------
+27==            --------------------------------------------------LN--------
+28==            --------------------------------------------------LN--------
+29==            ---------------------------------PGFPRV----EPDSVIALNG-------
+30==            ---------------------------------PGFPRV----QPESVISLNG-------
+31=p            ---------------------------------PGFPRV----QPESVISLNG-------
+32==            --------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+33=p            --------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+34==            SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+35=p            SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+36==            -------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
                                                                             
 
 1==             ------------------------------------------------------------
@@ -280,217 +280,179 @@
 11==            ------------------------------------------------------------
 12==            ------------------------------------------------------------
 13==            ------------------------------------------------------------
-14==            KMN---------------VESLRS------------------------------------
-15==            KMN---------------VDSLRS------------------------------------
-16==            KMN---------------VESLRS------------------------------------
-17==            KMN---------------VESLRS------------------------------------
-18==            KMN---------------VSTLRS------------------------------------
-19==            KMN---------------VTNLRS------------------------------------
-20==            KMN---------------VKSLRS------------------------------------
-21==            KMN---------------VKSLRS------------------------------------
-22==            KMN---------------VKSLRS------------------------------------
-23==            KMN---------------VKSLRS------------------------------------
-24==            KMN---------------VKSLRS------------------------------------
-25==            KMN---------------VASLRS------------------------------------
-26==            KMN---------------VASLRA------------------------------------
-27==            RLN---------------AKELR-------------------------------------
-28==            RLN---------------AKELR-------------------------------------
-29==            ALNG--------------IVKLQ----------------------KEVEECANLSR----
-30==            SLNG--------------VVKLQ----------------------KEVEECANLSR----
-31=p            SLNG--------------VVKLQ----------------------KEVEECANLSR----
-32==            -VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL
-33=p            -LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL
-34==            GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-35=p            GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-36==            LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP
+14==            --VESL------------------------------------------------------
+15==            --VDSL------------------------------------------------------
+16==            --VESL------------------------------------------------------
+17==            --VESL------------------------------------------------------
+18==            --VSTL------------------------------------------------------
+19==            --VTNL------------------------------------------------------
+20==            --VKSL------------------------------------------------------
+21==            --VKSL------------------------------------------------------
+22==            --VKSL------------------------------------------------------
+23==            --VKSL------------------------------------------------------
+24==            --VKSL------------------------------------------------------
+25==            --VASL------------------------------------------------------
+26==            --VASL------------------------------------------------------
+27==            --AKEL------------------------------------------------------
+28==            --AKEL------------------------------------------------------
+29==            --IVKL----------------------QK---------EVEECAN--------------
+30==            --VVKL----------------------QK---------EVEECAN--------------
+31=p            --VVKL----------------------QK---------EVEECAN--------------
+32==            -------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+33=p            -------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+34==            -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+35=p            -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+36==            AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
                                                                             
 
-1==             --------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA
-2==             --------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA
-3==             --------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA
-4=p             --------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA
-5=p             --------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA
-6==             --------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS
-7==             --------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA
-8=opsin,        --------------------ESESTQK------AEKEVTRMVVVMVLAFC----------
-9==             --------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA
-10==            --------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA
-11==            --------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV
-12==            --------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA
-13==            --------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA
-14==            -------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS
-15==            -------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS
-16==            -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-17==            -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-18==            --------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS
-19==            --------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT
-20==            --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-21==            --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-22==            --------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN
-23==            --------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC
-24==            --------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC
-25==            --------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN
-26==            -------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS
-27==            --------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA
-28==            --------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA
-29==            --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-30==            --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-31=p            --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-32==            PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-33=p            PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-34==            DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-35=p            DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-36==            TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA
-                                                  * .           :           
+1==             -------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+2==             -------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+3==             -------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+4=p             -------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+5=p             -------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+6==             -------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+7==             -------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+8=opsin,        -------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+9==             -------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+10==            -------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+11==            -------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+12==            -------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+13==            -------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+14==            ----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+15==            ----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+16==            ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+17==            ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+18==            ----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+19==            ----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+20==            ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+21==            ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+22==            ----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+23==            ----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+24==            ----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+25==            ----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+26==            ----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+27==            ----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+28==            ----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+29==            ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+30==            ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+31=p            ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+32==            PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+33=p            SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+34==            -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+35=p            -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+36==            AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+                                           * .           :                  
 
-1==             FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------
-2==             MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------
-3==             FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------
-4=p             AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------
-5=p             AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------
-6==             LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------
-7==             MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------
+1==             QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+2==             QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+3==             KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+4=p             KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+5=p             KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+6==             RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+7==             RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
 8=opsin,        ------------------------------------------------------------
-9==             CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
-10==            CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
-11==            SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF-------
-12==            CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF-------
-13==            LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY---
-14==            LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---
-15==            LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---
-16==            LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---
-17==            LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---
-18==            LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV---
-19==            IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV---
-20==            CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-21==            CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-22==            CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-23==            YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF---
-24==            YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC---
-25==            FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC---
-26==            WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC---
-27==            LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ
-28==            LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ
-29==            TARPFICGTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
-30==            TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------
-31=p            TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
-32==            LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
-33=p            LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
-34==            LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
-35=p            LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
-36==            ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------
+9==             PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+10==            PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+11==            PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+12==            PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+13==            KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+14==            DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+15==            DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+16==            DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+17==            DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+18==            DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+19==            NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+20==            F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+21==            F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+22==            F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+23==            I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+24==            I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+25==            L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+26==            SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+27==            PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+28==            PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+29==            GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+30==            GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+31=p            GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+32==            ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
+33=p            ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
+34==            DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+35=p            DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+36==            DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
                                                                             
 
-1==             --GKNPLGDDE--SGASTSKTEVSSVS-TSPVS---------------------------
-2==             --GKNPLGDDE--ASATASKTE------TSQVA---------------------------
-3==             --GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS---------------------------
-4=p             --GKNPLGDDE-SSTVSTSKTEVSS------VS---------------------------
-5=p             --GKNPLGDEE-SSTVSTSKTEVSS------VS---------------------------
-6==             --GKN-IEEDE--ASTSSQVTQVSS------VA---------------------------
-7==             --GKA-MTDES--DTCSSQKTEVSTVS-STQVG---------------------------
+1==             GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+2==             GDDE--ASATASKTE------TSQVAPA--------------------------------
+3==             GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+4=p             GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+5=p             GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+6==             EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+7==             TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
 8=opsin,        ------------------------------------------------------------
-9==             --GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
-10==            --GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
-11==            --GKK-VDDGS--EASTTSRTEVSSVS-NSSVA---------------------------
-12==            --GKK-VDDGS--EVST-SRTEVSSVS-NSSVS---------------------------
-13==            -QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM---------------------------
-14==            ---NE-KAPES----SAVASTSTTQEPQQTTAA---------------------------
-15==            ---SE-KAPES----RAAISTSTTQEQQQTTAA---------------------------
-16==            ---NE-KSGEI----SSAQSTTTQEQ-QQTTAA---------------------------
-17==            ---NE-KSGEA----SSAQSTTTQEQTQQTSAA---------------------------
-18==            ---HE-TETKS-NDDSQSNSTVAQDKA---------------------------------
-19==            ---HE-KDPND-VEENQSSNTQTQEKS---------------------------------
-20==            ---GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-21==            ---GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-22==            ---GK-VDDGK-SSEAQSQATTSEAESKA-------------------------------
-23==            ---GN-TDEPKPDAPASDTETTSEADSKA-------------------------------
-24==            ---GT-TDEPKPDAPPSDTETTSEAESKD-------------------------------
-25==            ----A-AEPSS-DAVSTTSGTTTVTDNEKSNA----------------------------
-26==            ---GS-GESGS-DVKSEASATTTMEEKPKIPEA---------------------------
-27==            FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG
-28==            FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG
-29==            ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-30==            ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-31=p            ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-32==            ---KF-CRQ---------------------------------------------------
-33=p            ---KF-CRR---------------------------------------------------
-34==            ---KY-RRGHR-------------------------------------------------
-35=p            ---KY-RRGHR-------------------------------------------------
-36==            ---RR-VRRRR--A----------------------------------------------
-                                                                            
-
-1==             -----------------------------------PA-----------------------
-2==             -----------------------------------PA-----------------------
-3==             -----------------------------------PA-----------------------
-4=p             -----------------------------------PA-----------------------
-5=p             -----------------------------------PA-----------------------
-6==             -----------------------------------PEK----------------------
-7==             -----------------------------------PN-----------------------
-8=opsin,        ------------------------------------------------------------
-9==             -----------------------------------PA-----------------------
-10==            -----------------------------------PA-----------------------
-11==            -----------------------------------PA-----------------------
-12==            -----------------------------------PA-----------------------
-13==            -----------------------------------PAHPV--------------------
-14==            ------------------------------------------------------------
-15==            ------------------------------------------------------------
-16==            ------------------------------------------------------------
-17==            ------------------------------------------------------------
-18==            ------------------------------------------------------------
-19==            ------------------------------------------------------------
-20==            ------------------------------------------------------------
-21==            ------------------------------------------------------------
-22==            ------------------------------------------------------------
-23==            ------------------------------------------------------------
-24==            ------------------------------------------------------------
-25==            ------------------------------------------------------------
-26==            ------------------------------------------------------------
-27==            Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY
-28==            YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY
-29==            -----------------------------------PERPEFVL-QNADYCRKKGHDS---
-30==            -----------------------------------PERSEFVL-QNSDHCGKKGHDT---
-31=p            -----------------------------------PERSEFVL-QNSDHCGKKGHDT---
+9==             DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+10==            DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+11==            DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+12==            DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+13==            GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+14==            EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+15==            EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+16==            EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+17==            EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+18==            ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+19==            DPND--VEENQSSNTQTQEK-S--------------------------------------
+20==            DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+21==            DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+22==            DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+23==            DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+24==            DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+25==            EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+26==            ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+27==            EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+28==            EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+29==            ------KLSAAGMHEALKLAERPERPEF------------VLQNADY-------------
+30==            ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+31=p            ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
 32==            ------------------------------------------------------------
 33=p            ------------------------------------------------------------
 34==            ------------------------------------------------------------
 35=p            ------------------------------------------------------------
-36==            -----------------------------------PQ-----------------------
+36==            ------A---------------PQ------------------------------------
                                                                             
 
-1==             --
-2==             --
-3==             --
-4=p             --
-5=p             --
-6==             --
-7==             --
-8=opsin,        --
-9==             --
-10==            --
-11==            --
-12==            --
-13==            --
-14==            --
-15==            --
-16==            --
-17==            --
-18==            --
-19==            --
-20==            --
-21==            --
-22==            --
-23==            --
-24==            --
-25==            --
-26==            --
-27==            QA
-28==            QA
-29==            --
-30==            --
-31=p            --
-32==            --
-33=p            --
-34==            --
-35=p            --
-36==            --
-                  
+1==             ---------------------------------------------------------
+2==             ---------------------------------------------------------
+3==             ---------------------------------------------------------
+4=p             ---------------------------------------------------------
+5=p             ---------------------------------------------------------
+6==             ---------------------------------------------------------
+7==             ---------------------------------------------------------
+8=opsin,        ---------------------------------------------------------
+9==             ---------------------------------------------------------
+10==            ---------------------------------------------------------
+11==            ---------------------------------------------------------
+12==            ---------------------------------------------------------
+13==            ---------------------------------------------------------
+14==            ---------------------------------------------------------
+15==            ---------------------------------------------------------
+16==            ---------------------------------------------------------
+17==            ---------------------------------------------------------
+18==            ---------------------------------------------------------
+19==            ---------------------------------------------------------
+20==            ---------------------------------------------------------
+21==            ---------------------------------------------------------
+22==            ---------------------------------------------------------
+23==            ---------------------------------------------------------
+24==            ---------------------------------------------------------
+25==            ---------------------------------------------------------
+26==            ---------------------------------------------------------
+27==            QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
+28==            QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
+29==            --------------------------------------------CRKKGHDS-----
+30==            --------------------------------------------CGKKGHDT-----
+31=p            --------------------------------------------CGKKGHDT-----
+32==            ---------------------------------------------------------
+33=p            ---------------------------------------------------------
+34==            ---------------------------------------------------------
+35=p            ---------------------------------------------------------
+36==            ---------------------------------------------------------
+