Mercurial > repos > rnateam > mafft
changeset 7:aaefa93c2dd2 draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mafft commit eff9db2cd18c82a7de37851571b8989b48014c71"
author | rnateam |
---|---|
date | Wed, 15 Apr 2020 15:33:37 -0400 |
parents | c5908940967d |
children | 4de39704d423 |
files | macros.xml mafft-add.xml mafft.xml test-data/add_seq.fa test-data/mafft_add_result.aln test-data/mafft_custom_result.aln test-data/mafft_fftns_result.aln test-data/mafft_nwns_result.aln |
diffstat | 8 files changed, 2173 insertions(+), 1137 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Wed Apr 15 15:33:37 2020 -0400 @@ -0,0 +1,19 @@ +<?xml version="1.0" encoding="UTF-8"?> +<macros> + <!-- Wrapper revision; the tool files append it to the version as "+galaxy@VERSION@". --> + <token name="@VERSION@">1</token> + <!-- Wrapped MAFFT release; reused by the mafft requirement below so the two values cannot drift apart. --> + <token name="@TOOL_VERSION@">7.455</token> + <!-- Packages requested by every tool that expands this macro. NOTE(review): fasta3 is presumably what provides the fasta36 binary looked up by mafft.xml for its FASTA pairwise mode; confirm. --> + <xml name="requirements"> + <requirements> + <requirement type="package" version="@TOOL_VERSION@">mafft</requirement> + <requirement type="package" version="36.3.8">fasta3</requirement> + </requirements> + </xml> + <xml name="citations"> + <citations> + <citation type="doi">10.1093/molbev/mst010</citation> + </citations> + </xml> +</macros>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mafft-add.xml Wed Apr 15 15:33:37 2020 -0400 @@ -0,0 +1,88 @@ +<?xml version="1.0" encoding="UTF-8"?> +<tool id="rbc_mafft_add" name="MAFFT add" version="@TOOL_VERSION@+galaxy@VERSION@"> + <description>Align a sequence,alignment or fragments to an existing alignment.</description> + <macros> + <import>macros.xml</import> + </macros> + <expand macro="requirements" /> + <stdio> + <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" /> + <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" /> + </stdio> + <version_command> <![CDATA[ + mafft --version + ]]> + </version_command> + <command> + <![CDATA[ + mafft + #if $sequences.sequenceType == 'singleseq' + $sequences.preservegap '$inputSequences' + #elif $sequences.sequenceType == 'frags' + --addfragments '$inputSequences' + #elif $sequences.sequenceType == 'group' + --addprofile '$inputSequences' + #end if + $keeplength $map $reorder + '$inputAlignment' + > '$outputAlignment' + #if $map == '--mapout' + && mv '${inputSequences}.map' '$outputmap' + #end if + ]]> + </command> + <inputs> + <param name="inputSequences" type="data" format="fasta" label="Sequences to add to the alignment" help="Amino acid or nucleotide sequences in FASTA format."/> + <param name="inputAlignment" type="data" format="fasta" label="Alignment" help="Amino acid or nucleotide sequences in aligned FASTA format."/> + <conditional name="sequences"> + <param name="sequenceType" type="select" label="What do you want to add to the alignment" > + <option value="singleseq">A single sequence</option> + <option value="frags" selected="true">Fragments</option> + <option value="group">An alignment</option> + </param> + <when value='singleseq'> + <param name="preservegap" type="select" label="Preserve the original alignment" help="Keep the given alignment unchanged (--add .)If not, the aligned letters in the seed 
alignment are preserved but gaps are not necessarily preserved (--seed)"> + <option value="--add" selected="true" >Yes</option> + <option value="--seed">No</option> + </param> + </when> + <when value='frags'/> + <when value='group'/> + </conditional> + <param name="keeplength" type="boolean" truevalue="--keeplength" falsevalue="" checked="True" label="Keep alignment length" help="The alignment length is unchanged. Insertions at the additional sequences are deleted" /> + <param name="map" type="boolean" truevalue="--mapout" falsevalue="" checked="False" label="Output a correspondence table of positions (--mapout)" help="Output a correspondence table of positions, sequence.map, between before and after the calculation. The --mapout option automatically turns on the --keeplength option, to keep the numbering of sites in the reference alignment" /> + <param name="reorder" type="boolean" truevalue="" falsevalue="--reorder" checked="True" label="Preserve the original order of sequences (--reorder)" /> + </inputs> + <outputs> + <data format="fasta" name="outputAlignment" label="${tool.name} on ${on_string} : New alignment"/> + <!-- Only produced when the "map" option is checked; the command then moves the .map file into this dataset. --> + <data name="outputmap" format="tabular" label="${tool.name} on ${on_string} : Correspondence of positions "> + <filter>map == True</filter> + </data> + </outputs> + <tests> + <test expect_num_outputs="1" > + <param name="inputSequences" value="add_seq.fa"/> + <param name="inputAlignment" value="mafft_fftns_result.aln"/> + <param name="sequenceType" value="singleseq"/> + <param name="preservegap" value="--add"/> + <param name="keeplength" value="--keeplength"/> + <param name="map" value=""/> + <output name="outputAlignment" ftype="fasta" file="mafft_add_result.aln"/> + </test> + </tests> + <help> + <![CDATA[ +Add one or more sequences to an existing alignment. The new sequence(s) can be complete, fragments, or another alignment. + +- Sequences in new_sequences are ungapped and then aligned to existing_alignment. 
+- new_sequences is a single multi-FASTA format file. +- existing_alignment is a single multi-FASTA format file. +- Gaps in existing_alignment are preserved by default (--add), but this can be deactivated (--seed). In that case the aligned letters in the seed alignment are preserved but gaps are not necessarily preserved. +- The alignment length is kept unchanged if the --keeplength option is given; insertions at the new sequences are deleted. +- The --mapout option outputs a correspondence table of positions, new_sequences.map, between before and after the calculation. The --mapout option automatically turns on the --keeplength option, to keep the numbering of sites in the reference alignment. +- Omit --reorder to preserve the original sequence order. + + ]]> + </help> + <expand macro="citations" /> +</tool>
--- a/mafft.xml Sat Nov 11 15:06:34 2017 -0500 +++ b/mafft.xml Wed Apr 15 15:33:37 2020 -0400 @@ -1,229 +1,294 @@ -<tool id="rbc_mafft" name="MAFFT" version="7.221.3"> - <description>Multiple alignment program for amino acid or nucleotide sequences</description> - <requirements> - <requirement type="package" version="7.221">mafft</requirement> - </requirements> - <stdio> - <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" /> - <exit_code range=":-1" level="fatal" description="Error occurred. Please check Tool Standard Error" /> - </stdio> - <version_command> - <![CDATA[ - mafft --version - ]]> - </version_command> - <command> - <![CDATA[ - #if $cond_flavour.flavourType != 'custom' - $cond_flavour.flavourType - #elif $cond_flavour.flavourType == 'custom' - ### full parameter options - mafft - $cond_flavour.distance_method - --retree $cond_flavour.retree - --maxiterate $cond_flavour.iterations - #end if - - ## specify threads to use - --thread \${GALAXY_SLOTS:-1} - - $datatype - --ep $ep - --op $op - $adjustdirection - - #if $matrix_condition.matrix == "BLOSUM" - --bl ${matrix_condition.BLOSUM} - #elif $matrix_condition.matrix == "PAM" - --jtt ${matrix_condition.PAM} - #end if - - $reorder - $getTree - $outputFormat - $inputSequences > $outputAlignment; - - #if $getTree == "--treeout" - mv ${inputSequences}.tree $outputTree; - #end if - ]]> - </command> - <inputs> - <param name="inputSequences" type="data" format="fasta" label="Sequences to align" help="Amino acid or nucleotide sequences in FASTA format."/> - <param name="datatype" type="select" label="Data type"> - <option value="">Auto detection</option> - <option value="--nuc">Nucleic acids</option> - <option value="--amino">Amino acids</option> - </param> - <conditional name="cond_flavour"> - <param name="flavourType" type="select" label="MAFFT flavour" help="Run mafft with pre-defined input parameters. 
Specification of these parameters can be found in the help section."> - <option value="mafft --auto">auto</option> - <option value="mafft-fftns" selected="true">fftns</option> - <option value="mafft-fftnsi">fftnsi</option> - <option value="mafft-nwns">nwns</option> - <option value="mafft-nwnsi">nwnsi</option> - <option value="mafft-einsi">einsi</option> - <option value="mafft-ginsi">ginsi</option> - <option value="mafft-linsi">linsi</option> - <option value="mafft-qinsi">qinsi</option> - <option value="mafft-xinsi">xinsi</option> - <option value="custom">Custom Parameters</option> - </param> - <when value="mafft-fftns"/> - <when value="mafft --auto"/> - <when value="mafft-fftnsi"/> - <when value="mafft-nwns"/> - <when value="mafft-nwnsi"/> - <when value="mafft-einsi"/> - <when value="mafft-ginsi"/> - <when value="mafft-linsi"/> - <when value="mafft-qinsi"/> - <when value="mafft-xinsi"/> - <when value="custom"> - <param name="distance_method" type="select" display="radio" label="Distance method" help="Distance method must be chosen regarding your data"> - <option value="--6merpair" selected="true">Shared 6mers distance (fastest)</option> - <option value="--globalpair">Global alignment (Needleman-Wunsch)</option> - <option value="--localpair">Local alignment (Smith-Waterman)</option> - <option value="--genafpair">Local, affine gap cost</option> - </param> - <param name="retree" type="integer" value="2" min="1" max="100" label="Guide tree is built this number of times in the progressive stage." help="Valid with 6mer distance" /> - <param name="iterations" type="integer" value="0" min="0" max="1000" label="Maximum number of iterations" help="1000 for maximum quality" /> - </when> - </conditional> - <param name="ep" type="float" value="0.123" label="Gap extend penalty" help="Offset value, which works like gap extension penalty, for group-to-group alignment. 
For E-INS-i, 0 is recommended to allow large gaps" /> - <param name="op" type="float" value="1.53" label="Gap opening penalty" help="1.53 default value" /> - <param name="adjustdirection" type="select" display="radio" label="Direction of nucleotide sequences" help="Generate reverse complement sequences, as necessary, and align them together with the remaining sequences"> - <option value="--adjustdirection">adjust direction</option> - <option value=" " selected="true">do not adjust direction</option> - </param> - <conditional name="matrix_condition"> - <param name="matrix" type="select" label="Matrix selection" display="radio" help="Usefull only for amino acids" > - <option value="">No matrix</option> - <option value="BLOSUM">BLOSUM</option> - <option value="PAM">PAM</option> - </param> - <when value=""/> - <when value="BLOSUM"> - <param name="BLOSUM" type="select" display="radio" label="Coefficient of the BLOSUM matrix"> - <option value="30">30</option> - <option value="45">45</option> - <option value="62" selected="true">62</option> - <option value="80">80</option> - </param> - </when> - <when value="PAM"> - <param name="PAM" type="integer" value="80" min="1" max="350" label="Coefficient of the PAM matrix" /> - </when> - </conditional> - <param name="reorder" type="boolean" truevalue="--reorder" falsevalue="" checked="False" label="Reorder output?" /> - <param name="getTree" type="boolean" truevalue="--treeout" falsevalue="" checked="False" label="Display alignment tree ?" 
/> - <param name="outputFormat" type="select" label="Output format" help="Either FASTA or ClustalW"> - <option value="" selected="true">FASTA</option> - <option value="--clustalout">ClustalW</option> - <option value="--phylipout">Phylip</option> - </param> - </inputs> - <outputs> - <data format="fasta" name="outputAlignment" label="${tool.name} on ${on_string}"> - <change_format> - <when input="outputFormat" value="--clustalout" format="clustal"/> - <when input="outputFormat" value="--phylipout" format="phylip"/> - </change_format> - </data> - <data name="outputTree" format="txt" label="${tool.name} Guide Tree"> - <filter>getTree == True</filter> - </data> - </outputs> - <tests> - <test> - <param name="inputSequences" value="sample.fa"/> - <param name="flavourType" value="mafft-fftns"/> - <param name="outputFormat" value=""/> - <output name="outputAlignment" ftype="fasta" file="mafft_fftns_result.aln"/> - </test> - <test> - <param name="inputSequences" value="sample.fa"/> - <param name="flavourType" value="mafft-nwns"/> - <param name="outputFormat" value="--clustalout"/> - <output name="outputAlignment" ftype="clustal" file="mafft_nwns_result.aln"/> - </test> - </tests> - <help> - <![CDATA[ -**What it does** - -MAFFT is a multiple sequence alignment program for unix-like operating systems. -It offers a range of multiple alignment methods, L-INS-i (accurate; for alignment of <∼200 sequences), -FFT-NS-2 (fast; for alignment of <∼30,000 sequences), etc. - -From the MAFFT man page, an overview of the different predefined flavours of the tool. 
- -**Accuracy-oriented methods:** - -- L-INS-i (probably most accurate; recommended for <200 sequences; iterative refinement method incorporating local pairwise alignment information): - - - mafft --localpair --maxiterate 1000 input [> output] - -- G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information): - - - mafft --globalpair --maxiterate 1000 input [> output] - -- E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences): - - - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps. - - -**Speed-oriented methods:** - -- FFT-NS-i (iterative refinement method; two cycles only): - - - mafft --retree 2 --maxiterate 2 input [> output] - -- FFT-NS-i (iterative refinement method; max. 1000 iterations): - - - mafft --retree 2 --maxiterate 1000 input [> output] - -- FFT-NS-2 (fast; progressive method): - - - mafft --retree 2 --maxiterate 0 input [> output] - -- FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree): - - - mafft --retree 1 --maxiterate 0 input [> output] - -- NW-NS-i (iterative refinement method without FFT approximation; two cycles only): - - - mafft --retree 2 --maxiterate 2 --nofft input [> output] - -- NW-NS-2 (fast; progressive method without the FFT approximation): - - - mafft --retree 2 --maxiterate 0 --nofft input [> output] - -- NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm): - - - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output] - -**Options:** - ---auto - Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. 
Default: off (always FFT-NS-2) ---adjustdirection - Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored. ---op - Gap opening penalty, default: 1.53 ---ep - Offset (works like gap extension penalty), default: 0.0 ---maxiterate - Maximum number of iterative refinement, default: 0 ---clustalout - Output: clustal format, default: fasta ---thread - Number of threads (if unsure, --thread -1) ---retree number - Guide tree is built number times in the progressive stage. Valid with 6mer distance. Default: 2 - ]]> - </help> - <citations> - <citation type="doi">10.1093/molbev/mst010</citation> - </citations> -</tool> +<?xml version="1.0" encoding="UTF-8"?> +<tool id="rbc_mafft" name="MAFFT" version="@TOOL_VERSION@+galaxy@VERSION@"> + <description>Multiple alignment program for amino acid or nucleotide sequences</description> + <macros> + <import>macros.xml</import> + </macros> + <expand macro="requirements" /> + <stdio> + <exit_code range="1:" level="fatal" description="Error occurred. Please check Tool Standard Error" /> + <exit_code range=":-1" level="fatal" description="Error occurred. 
Please check Tool Standard Error" /> + </stdio> + <version_command> <![CDATA[ + mafft --version + ]]> + </version_command> + <command> + <![CDATA[ + + ## Assemble the MAFFT call: either a predefined flavour executable, or plain mafft with the custom distance-method options + #if $cond_flavour.flavourType == 'custom' + #if $cond_flavour.dist_flavour.distance_method == '--fastapair' + export FASTA_4_MAFFT=`which fasta36`; + #end if + #end if + + #if $cond_flavour.flavourType != 'custom' + $cond_flavour.flavourType + #elif $cond_flavour.flavourType == 'custom' + ### full parameter options + mafft + $cond_flavour.dist_flavour.distance_method + #if $cond_flavour.dist_flavour.distance_method == '--6merpair' + --retree $cond_flavour.dist_flavour.retree + ## usetree is a conditional nested in dist_flavour (next to distance_method), so it is addressed through dist_flavour + $cond_flavour.dist_flavour.usetree.parttree + + #if $cond_flavour.dist_flavour.usetree.parttree == '--parttree' + ## NOTE(review): --fastaparttree may also need FASTA_4_MAFFT, which is only exported for --fastapair above; confirm + $cond_flavour.dist_flavour.usetree.treedistance + --partsize $cond_flavour.dist_flavour.usetree.partsize + ## groupsize has no default value, so the flag is only emitted when a number was entered + #if str($cond_flavour.dist_flavour.usetree.groupsize) != '' + --groupsize $cond_flavour.dist_flavour.usetree.groupsize + #end if + #end if + + #elif $cond_flavour.dist_flavour.distance_method == '--globalpair' + --weighti $cond_flavour.dist_flavour.weighti + #elif $cond_flavour.dist_flavour.distance_method == '--localpair' + --weighti $cond_flavour.dist_flavour.weighti + --lop $cond_flavour.dist_flavour.lop + --lep $cond_flavour.dist_flavour.lep + --lexp $cond_flavour.dist_flavour.lexp + #elif $cond_flavour.dist_flavour.distance_method == '--genafpair' + --weighti $cond_flavour.dist_flavour.weighti + --lop $cond_flavour.dist_flavour.lop + --lep $cond_flavour.dist_flavour.lep + --lexp $cond_flavour.dist_flavour.lexp + --LOP $cond_flavour.dist_flavour.skipLOP + ## the skip-alignment gap extension penalty is passed with --LEXP + --LEXP $cond_flavour.dist_flavour.skipEXP + #elif $cond_flavour.dist_flavour.distance_method == '--fastapair' + --weighti $cond_flavour.dist_flavour.weighti + #end if + --maxiterate $cond_flavour.iterations + $cond_flavour.fft + $cond_flavour.score + #end if + + ## specify threads to use + --thread \${GALAXY_SLOTS:-1} + $datatype + --ep $ep + --op $op + + #if $matrix_condition.matrix == 
"BLOSUM" + --bl $matrix_condition.BLOSUM + #elif $matrix_condition.matrix == "PAM" + --jtt $matrix_condition.PAM + --tm $matrix_condition.tm + #elif $matrix_condition.matrix == "custom" + --aamatrix '$matrix_condition.matrixfile' + --fmodel $matrix_condition.fmodel + #end if + + $reorder + $getTree + $outputFormat + '$inputSequences' > '$outputAlignment'; + + #if $getTree == "--treeout" + mv '${inputSequences}.tree' '$outputTree'; + #end if + ]]> + </command> + <inputs> + <param name="inputSequences" type="data" format="fasta" label="Sequences to align" help="Amino acid or nucleotide sequences in FASTA format."/> + <param name="datatype" type="select" label="Data type"> + <option value="">Auto detection</option> + <option value="--nuc">Nucleic acids</option> + <option value="--amino">Amino acids</option> + </param> + <conditional name="cond_flavour"> + <param name="flavourType" type="select" label="MAFFT flavour" help="Run mafft with pre-defined input parameters. Specification of these parameters can be found in the help section."> + <option value="mafft --auto">auto</option> + <option value="mafft-fftns" selected="true">fftns</option> + <option value="mafft-fftnsi">fftnsi</option> + <option value="mafft-nwns">nwns</option> + <option value="mafft-nwnsi">nwnsi</option> + <option value="mafft-einsi">einsi</option> + <option value="mafft-ginsi">ginsi</option> + <option value="mafft-linsi">linsi</option> + <option value="mafft-qinsi">qinsi</option> + <option value="mafft-xinsi">xinsi</option> + <option value="custom">Custom Parameters</option> + </param> + <when value="mafft-fftns"/> + <when value="mafft --auto"/> + <when value="mafft-fftnsi"/> + <when value="mafft-nwns"/> + <when value="mafft-nwnsi"/> + <when value="mafft-einsi"/> + <when value="mafft-ginsi"/> + <when value="mafft-linsi"/> + <when value="mafft-qinsi"/> + <when value="mafft-xinsi"/> + <when value="custom"> + <conditional name="dist_flavour"> + <param name="distance_method" type="select" display="radio" 
label="Distance method" help="Distance method must be chosen regarding your data"> + <option value="--6merpair" selected="true">Shared 6mers distance (fastest)</option> + <option value="--globalpair">Global alignment (Needleman-Wunsch)</option> + <option value="--localpair">Local alignment (Smith-Waterman)</option> + <option value="--genafpair">Local, affine gap cost</option> + <option value="--fastapair">All pairwise alignments are computed with FASTA</option> + </param> + <when value="--6merpair"> + <param name="retree" type="integer" value="2" min="1" max="100" label="Guide tree is built this number of times in the progressive stage." help="Valid with 6mer distance" /> + <conditional name="usetree"> + <param name="parttree" type="select" label="Use a fast tree-building method?" help="Recommended for a large number (> ~10,000) of sequences are input" > + <option value="--parttree" selected="true">Yes</option> + <option value="">No</option> + </param> + <when value="--parttree"> + <param name="treedistance" type="select" display="radio" label="Distance method" help="Distance method must be chosen regarding your data"> + <option value="--fastaparttree" selected="true">Distances based on FASTA</option> + <option value="--dpparttree">Distances based on DP. (Needleman-Wunsch)</option> + </param> + <param name="partsize" type="integer" value="50" min="0" max="1000" label="Number of partitions in the PartTree algorithm" /> + <param name="groupsize" type="integer" value="" min="0" max="1000" label="Do not make alignment larger than ... sequences" /> + </when> + <when value=""/> + </conditional> + </when> + <when value="--globalpair"> + <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." 
/> + </when> + <when value="--localpair"> + <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." /> + <param name="lop" type="float" value="-2.0" label="Gap opening penalty at local pairwise alignment" help="-2.00 default value" /> + <param name="lep" type="float" value="0.1" label="Offset value at local pairwise alignment" help="0.1 default value" /> + <param name="lexp" type="float" value="-0.1" label="Gap extension penalty at local pairwise alignment." help="-0.1 default value" /> + </when> + <when value="--genafpair"> + <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." /> + <param name="lop" type="float" value="-2.0" label="Gap opening penalty at local pairwise alignment" help="-2.00 default value" /> + <param name="lep" type="float" value="0.1" label="Offset value at local pairwise alignment" help="0.1 default value" /> + <param name="lexp" type="float" value="-0.1" label="Gap extension penalty at local pairwise alignment." help="-0.1 default value" /> + <param name="skipLOP" type="float" value="-6.00" label="Gap opening penalty to skip the alignment" help="-6.00 default value" /> + <param name="skipEXP" type="float" value="0.00" label="Gap extension penalty to skip the alignment" help="0 default value" /> + </when> + <when value="--fastapair"> + <param name="weighti" type="float" value="2.7" min="1" max="100" label="Weighting factor for the consistency term calculated from pairwise alignments." help="Valid when either of --globalpair, --localpair, --genafpair, --fastapair or --blastpair is selected." 
/> + </when> + </conditional> + <param name="iterations" type="integer" value="0" min="0" max="1000" label="Maximum number of iterations" help="1000 for maximum quality" /> + <param name="fft" type="boolean" truevalue="--fft" falsevalue="--nofft" checked="True" label="Use FFT approximation in group-to-group alignment?" /> + <param name="score" type="boolean" truevalue="" falsevalue="--noscore" checked="True" label="Check alignment score in the iterative refinement stage?" /> + </when> + </conditional> + <param name="ep" type="float" value="0.0" label="Gap extend penalty for group-to-group alignment" help="Offset value, which works like gap extension penalty, for group-to-group alignment. For E-INS-i, 0 is recommended to allow large gaps" /> + <param name="op" type="float" value="1.53" label="Gap opening penalty at group-to-group alignment." help="1.53 default value" /> + <conditional name="matrix_condition"> + <param name="matrix" type="select" label="Matrix selection" display="radio" help="Usefull only for amino acids" > + <option value="">No matrix</option> + <option value="BLOSUM" selected="true">BLOSUM</option> + <option value="PAM">PAM</option> + <option value="custom">Custom</option> + </param> + <when value=""/> + <when value="BLOSUM"> + <param name="BLOSUM" type="select" display="radio" label="Coefficient of the BLOSUM matrix"> + <option value="30">30</option> + <option value="45">45</option> + <option value="62" selected="true">62</option> + <option value="80">80</option> + </param> + </when> + <when value="PAM"> + <param name="PAM" type="integer" value="80" min="1" max="350" label="Coefficient of the JTT PAM matrix" /> + <param name="tm" type="integer" value="80" min="1" max="350" label="Coefficient of the transmembrane PAM matrix" /> + </when> + <when value="custom"> + <param name="matrixfile" type="data" format="txt" label="User-defined AA scoring matrix" help="The format of matrixfile is the same to that of BLAST. 
Ignored when nucleotide sequences are input."/> + <param name="fmodel" type="boolean" truevalue="--fmodel" falsevalue="" checked="False" label="Incorporate the AA/nuc composition information into the scoring matrix?" /> + </when> + </conditional> + <param name="reorder" type="boolean" truevalue="--reorder" falsevalue="" checked="False" label="Reorder output?" /> + <param name="getTree" type="boolean" truevalue="--treeout" falsevalue="" checked="False" label="Display alignment tree ?" /> + <param name="outputFormat" type="select" label="Output format" help="Either FASTA or ClustalW"> + <option value="" selected="true">FASTA</option> + <option value="--clustalout">ClustalW</option> + <option value="--phylipout">Phylip</option> + </param> + </inputs> + <outputs> + <data format="fasta" name="outputAlignment" label="${tool.name} on ${on_string}"> + <change_format> + <when input="outputFormat" value="--clustalout" format="clustal"/> + <when input="outputFormat" value="--phylipout" format="phylip"/> + </change_format> + </data> + <data name="outputTree" format="txt" label="${tool.name} Guide Tree"> + <filter>getTree == True</filter> + </data> + </outputs> + <tests> + <test expect_num_outputs="1" > + <param name="inputSequences" value="sample.fa"/> + <param name="flavourType" value="mafft-fftns"/> + <param name="outputFormat" value=""/> + <output name="outputAlignment" ftype="fasta" file="mafft_fftns_result.aln"/> + </test> + <test expect_num_outputs="1" > + <param name="inputSequences" value="sample.fa"/> + <param name="flavourType" value="mafft-nwns"/> + <param name="outputFormat" value="--clustalout"/> + <output name="outputAlignment" ftype="clustal" file="mafft_nwns_result.aln"/> + </test> + <test expect_num_outputs="1" > + <param name="inputSequences" value="sample.fa"/> + <param name="flavourType" value="custom"/> + <param name="matrix_condition" value="BLOSUM"/> + <param name="BLOSUM" value="62"/> + <param name="distance_method" value="--fastapair"/> + <param 
name="weighti" value="2.7"/> + <param name="iterations" value="1000"/> + <param name="outputFormat" value="--clustalout"/> + <output name="outputAlignment" ftype="clustal" file="mafft_custom_result.aln"/> + </test> + </tests> + <help> <![CDATA[ + **What it does** + MAFFT is a multiple sequence alignment program for unix-like operating systems. + It offers a range of multiple alignment methods, L-INS-i (accurate; for alignment of <∼200 sequences), + FFT-NS-2 (fast; for alignment of <∼30,000 sequences), etc. + From the MAFFT man page, an overview of the different predefined flavours of the tool. + **Accuracy-oriented methods:** + - L-INS-i (probably most accurate; recommended for <200 sequences; iterative refinement method incorporating local pairwise alignment information): + - mafft --localpair --maxiterate 1000 input [> output] + - G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information): + - mafft --globalpair --maxiterate 1000 input [> output] + - E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences): + - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps. + **Speed-oriented methods:** + - FFT-NS-i (iterative refinement method; two cycles only): + - mafft --retree 2 --maxiterate 2 input [> output] + - FFT-NS-i (iterative refinement method; max. 
1000 iterations): + - mafft --retree 2 --maxiterate 1000 input [> output] + - FFT-NS-2 (fast; progressive method): + - mafft --retree 2 --maxiterate 0 input [> output] + - FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree): + - mafft --retree 1 --maxiterate 0 input [> output] + - NW-NS-i (iterative refinement method without FFT approximation; two cycles only): + - mafft --retree 2 --maxiterate 2 --nofft input [> output] + - NW-NS-2 (fast; progressive method without the FFT approximation): + - mafft --retree 2 --maxiterate 0 --nofft input [> output] + - NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm): + - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output] + + **Options:** + --auto + Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2) + --adjustdirection + Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored. + --op + Gap opening penalty, default: 1.53 + --ep + Offset (works like gap extension penalty), default: 0.0 + --maxiterate + Maximum number of iterative refinement, default: 0 + --clustalout + Output: clustal format, default: fasta + --thread + Number of threads (if unsure, --thread -1) + --retree number + Guide tree is built number times in the progressive stage. + Valid with 6mer distance. Default: 2 + ]]> + </help> + <expand macro="citations" /> +</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/add_seq.fa Wed Apr 15 15:33:37 2020 -0400 @@ -0,0 +1,2 @@ +> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91] +MNGTEGDNFYVPFSNKTGLARSPYEYPQYYLAEPWKYSALAAYMFFLILVGFPVNFLTLF
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/mafft_add_result.aln Wed Apr 15 15:33:37 2020 -0400 @@ -0,0 +1,481 @@ +> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91] +----------------------------------------MNG----------------T +E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL +AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM +N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM +GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF +VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H +QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL +GDDE--SGASTSKTEVSSVS-TSPVSPA-------------------------------- +--------------------------------------------------------- +> 2== U22180 1 rat opsin <rod>[J.Mol.Neurosci.5(3),207-209'94] +----------------------------------------MNG----------------T +E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML +AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL +H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM +GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF +VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H +QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL +GDDE--ASATASKTE------TSQVAPA-------------------------------- +--------------------------------------------------------- +> 3== M92038 1 chicken green sensitive cone opsin <retina>[PNAS89,5932-5936'9 +----------------------------------------MNG----------------T +E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV 
+CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW +N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM +GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF +VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N +KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF +GDEDVSSTVSQSKTEVSSVS-SSQVSPA-------------------------------- +--------------------------------------------------------- +> 4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish +----------------------------------------MNG----------------T +E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL +ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI +N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA +GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF +VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N +KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL +GDDE-SSTVSTSKTEVSS------VSPA-------------------------------- +--------------------------------------------------------- +> 5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish +----------------------------------------MNG----------------T +E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL +AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI +N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA +GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF +ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ 
+-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N +KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL +GDEE-SSTVSTSKTEVSS------VSPA-------------------------------- +--------------------------------------------------------- +> 6== L11864 1 Carassius auratus blue cone opsin <retina>[Biochemistry32,208- +----------------------------------------MKQ----------------V +PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM +SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF +N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA +GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF +CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H +RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I +EEDE--ASTSSQVTQVSS------VAPEK------------------------------- +--------------------------------------------------------- +> 7== M13299 1 human BCP <>[Science232(4747),193-202'86] +----------------------------------------MRK----------------M +S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ +AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC +N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT +VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF +IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N +RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M +TDES--DTCSSQKTEVSTVS-STQVGPN-------------------------------- +--------------------------------------------------------- +> 8=opsin, greensensitive human (fragment) S07060 +------------------------------------------------------------ 
+------------------------------------------------------------ +------------------------------------------DLAETVIA-STISIVNQV +S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEKEVTRMVVVMVLAFC----------------- +------------------------------------------------------------ +------------------------------------------------------------ +--------------------------------------------------------- +> 9== K03494 1 human GCP <>[Science232(4747),193-202'86] +----------------------------------------MAQQWSLQRLAGRHPQDSYE +DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV +Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV +GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N +PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +--------------------------------------------------------- +> 10== Z68193 1 human Red Opsin <>[] +----------------------------------------MAQQWSLQRLAGRHPQDSYE +DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV +S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK-------------------------- +------------------------------------------------------------ 
+------------------------------------------------------------ +-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N +PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +--------------------------------------------------------- +> 11== M92036 1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92] +----------------------------------------MTEAWNVAVFAARRSRDD-D +DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV +SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI +F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII +GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM +ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N +PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V +DDGS--EASTTSRTEVSSVS-NSSVAPA-------------------------------- +--------------------------------------------------------- +> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90] +----------------------------------------MAA-WEAAFAARRRHEE--E +DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT +SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI +S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA +GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM +VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N +PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--EVST-SRTEVSSVS-NSSVSPA-------------------------------- +--------------------------------------------------------- +> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95] 
+----------------------------------------MS-----------------S +NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV +AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI +N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS +GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF +VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H +KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T +GKAS--PGTPGPHADVTAAGLRNKVMPAHPV----------------------------- +--------------------------------------------------------- +> 14== M17718 1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87] +----------MESGNVSS------------SLFGNVST-ALRP----------------E +ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL +GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF +H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA +MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- +--------------------------------------------------MN-------- +--VESL------------------------------------------------------ +----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G +DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N +EKAP--ESSAVASTSTTQEP--QQTTAA-------------------------------- +--------------------------------------------------------- +> 15== X65879 1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92 +----------MEYHNVSS------------VL-GNVSS-VLRP----------------D +ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL +GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF +H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA +MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- 
+--------------------------------------------------MN-------- +--VDSL------------------------------------------------------ +----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G +DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S +EKAP--ESRAAISTSTTQEQ--QQTTAA-------------------------------- +--------------------------------------------------------- +> 16== M17730 1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87] +----------ME------------------PL-CNASEPPLRP----------------E +AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF +H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK------------------------- +--------------------------------------------------MN-------- +--VESL------------------------------------------------------ +----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N +EKSG--EISSAQST-TTQEQ--QQTTAA-------------------------------- +--------------------------------------------------------- +> 17== X65880 1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92 +----------MD------------------AL-CNASEPPLRP----------------E +ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF +H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK------------------------- +--------------------------------------------------MN-------- +--VESL------------------------------------------------------ +----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N +EKSG--EASSAQST-TTQEQ-TQQTSAA-------------------------------- 
+--------------------------------------------------------- +> 18== D50584 1 Hemigrapsus sanguineus opsin BcRh2 <compound eye>[J.Exp.Biol.1 +--------------------------------MTNATGPQMAY----------------Y +GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL +GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF +SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV +FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF +VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +--------------------------------------------------MN-------- +--VSTL------------------------------------------------------ +----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G +DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T +ETKS--NDDSQSNSTVAQDK-A-------------------------------------- +--------------------------------------------------------- +> 19== D50583 1 Hemigrapsus sanguineus opsin BcRh1 <compound eye>[J.Exp.Biol.1 +--------------------------------MANVTGPQMAF----------------Y +GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL +GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF +SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF +MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF +IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +--------------------------------------------------MN-------- +--VTNL------------------------------------------------------ +----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G +NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K +DPND--VEENQSSNTQTQEK-S-------------------------------------- +--------------------------------------------------------- +> 20== K02320 1 D.melanogaster opsin <>[Cell40,851-858'85] +----------ME----SF------------AVAAAQLGPHFAP----------------L +S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL +TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY 
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +--------------------------------------------------------- +> 21== K02315 1 D.melanogaster ninaE <>[Cell40,839-850'85] +----------ME----SF------------AVAAAQLGPHFAP----------------L +S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL +TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +--------------------------------------------------------- +> 22== X65877 1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204' +----------MD----SF------------AAVATQLGPQFAA----------------P +S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL +TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K 
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSEAQSQA-TTSEA-ESKA----------------------------------- +--------------------------------------------------------- +> 23== M12896 1 D.melanogaster Rh2 <>[Cell44,705-710'86] +-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q +SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL +GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS +LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K +I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T +DEPK--PDAPASDTETTSEA-DSKA----------------------------------- +--------------------------------------------------------- +> 24== X65878 1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92 +-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q +TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL +GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS +LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K +I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T +DEPK--PDAPPSDTETTSEA-ESKD----------------------------------- +--------------------------------------------------------- +> 25== U26026 1 Apis mellifera long-wavelength rhodopsin <>[] +--------------------------------MIAVSGPSYEA----------------F +SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL 
+GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY +Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI +RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG +IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK------------------------- +--------------------------------------------------MN-------- +--VASL------------------------------------------------------ +----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N +L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A +EPSS--DAVSTTSGTTTVTD-NEKSNA--------------------------------- +--------------------------------------------------------- +> 26== L03781 1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93] +----------------------------------MANQLSYSS----------------L +GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL +GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF +A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL +LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG +LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK------------------------- +--------------------------------------------------MN-------- +--VASL------------------------------------------------------ +----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S +SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G +ESGS--DVKSEASATTTMEE-KPKIPEA-------------------------------- +--------------------------------------------------------- +> 27== X07797 1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88] +---------------------------------------MVES----------------T +TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV +GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF +M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL +MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY +FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR------------------------- +--------------------------------------------------LN-------- +--AKEL------------------------------------------------------ 
+----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G +PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C +EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP +QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA +> 28== X70498 1 Todarodes pacificus rhodopsin <retina>[FEBS317(1-2),5-11'93] +----------------------------------------MGR----------------D +LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL +GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF +L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI +MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF +ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR------------------------- +--------------------------------------------------LN-------- +--AKEL------------------------------------------------------ +----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G +PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T +EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP +QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA +> 29== L21195 1 human serotonin 5-HT7 receptor protein <placenta and fetal bra +---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D +PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----EPDSVIALNG------- +--IVKL----------------------QK---------EVEECAN-------------- +----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERPEF------------VLQNADY------------- +--------------------------------------------CRKKGHDS----- +> 30== L15228 1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93] 
+------------------------------------------------------------ +------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----QPESVISLNG------- +--VVKL----------------------QK---------EVEECAN-------------- +----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- +--------------------------------------------CGKKGHDT----- +> 31=p A47425 serotonin receptor 5HT-7 - rat +------------------------------------------------------------ +------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----QPESVISLNG------- +--VVKL----------------------QK---------EVEECAN-------------- +----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- +--------------------------------------------CGKKGHDT----- +> 32== M83181 1 human serotonin receptor <>[JBC267(11),7553-7562'92] +----------MDVLSP-------------------------------------------- +---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT +SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- 
+--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR-- +-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG-- +PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ---- +------------------------------------------------------------ +--------------------------------------------------------- +> 33=p A35181 serotonin receptor class 1A - rat +----------MDVFSF-------------------------------------------- +---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT +SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- +--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG-- +-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG-- +SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR---- +------------------------------------------------------------ +--------------------------------------------------------- +> 34== L06803 1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93] +MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- +-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- +------------------------------------------------------------ +--------------------------------------------------------- +> 35=p A47174 serotonin 
receptor, 5HTlym receptor - great pond snail +MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- +-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- +------------------------------------------------------------ +--------------------------------------------------------- +> 36== X95604 1 Bombyx mori serotonin receptor <antennae>[InsectBiochem.Mol.Bi +-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T +VVPN--TTWW------------QASAPFDTPAALVRAAAK-------------------- +AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV +V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM +MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT +ASSFYVPVLIILILYWRIY-------QTARKRIR-------------------------- +-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA +AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV +AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C +DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR-- +------A---------------PQ------------------------------------ +--------------------------------------------------------- +> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91] +----------------------------------------MNG----------------T +E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL +AAYMFFLILVGFPVNFLTLF---------------------------------------- +------------------------------------------------------------ +------------------------------------------------------------ 
+------------------------------------------------------------ +------------------------------------------------------------ +------------------------------------------------------------ +------------------------------------------------------------ +------------------------------------------------------------ +------------------------------------------------------------ +---------------------------------------------------------
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/mafft_custom_result.aln Wed Apr 15 15:33:37 2020 -0400 @@ -0,0 +1,458 @@ +CLUSTAL format alignment by MAFFT F-INS-i (v7.455) + + +1== MN------------------------GTE--GDNFYVPFS--------NKTGL-ARSPYE +2== MN------------------------GTE--GPNFYVPFS--------NITGV-VRSPFE +3== MN------------------------GTE--GINFYVPMS--------NKTGV-VRSPFE +4=p MN------------------------GTE--GKNFYVPMS--------NRTGL-VRSPFE +5=p MN------------------------GTE--GNNFYVPLS--------NRTGL-VRSPFE +6== MK------------------------QVPEFHEDFYIPIP-------LDINNLSAYSPFL +7== MR------------------------KMS--EEEFYL------------FKNISSVGPWD +8=opsin, ------------------------------------------------------------ +9== MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE +10== MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE +11== MTEAWNVAVFAARRSRDD------DDTTR--GSVFTYTNT--------NN----TRGPFE +12== MA-AWEAA-FAARRRHEE------EDTTR--DSVFTYTNS--------NN----TRGPFE +13== MS----------------------SNSSQ--------------AP--PNG----TPGPFD +14== MESG-NV-----------------------------------------SSSLFGNVSTAL +15== MEYH-NV------------------------------------------SSVLGNVSSVL +16== MEPLCNA------------------------------------------------SEPPL +17== MDALCNA------------------------------------------------SEPPL +18== MT-------------------------------------------------------NAT +19== MA-------------------------------------------------------NVT +20== ME-------------------------------------------------SFAVAAAQL +21== ME-------------------------------------------------SFAVAAAQL +22== MD-------------------------------------------------SFAAVATQL +23== MERS--------------------------------------------HLPETPFDLAHS +24== MERS--------------------------------------------LLPEPPLAMALL +25== MI-------------------------------------------------------AVS +26== M----------------------------------------------------------- +27== MVESTT------------------------------------------------------ 
+28== MGRD-------------------------------------------------------- +29== MM-----DVNSSGRPDLYGH-----------LRSFLLPEVGRGLPDLSPDGGADPVAGSW +30== M----------------------------------------------------------- +31=p M----------------------------------------------------------- +32== MD------VLSPGQ----------------------------------GNNTTSPPAPFE +33=p MD------VFSFGQ----------------------------------GNNTTASQEPFG +34== MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL +35=p MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL +36== ME-------GAEGQEELD-------------WEALYLRL---------PLQNCSWNSTGW + + +1== YP---------------------------------------------------------- +2== QP---------------------------------------------------------- +3== YP---------------------------------------------------------- +4=p YP---------------------------------------------------------- +5=p YP---------------------------------------------------------- +6== VP---------------------------------------------------------- +7== GP---------------------------------------------------------- +8=opsin, ------------------------------------------------------------ +9== GP---------------------------------------------------------- +10== GP---------------------------------------------------------- +11== GP---------------------------------------------------------- +12== GP---------------------------------------------------------- +13== GP---------------------------------------------------------- +14== RPEARL----------------------SAETRLLGWNVPPEELRHIPEHWL-------- +15== RPDARL----------------------SAESRLLGWNVPPDELRHIPEHWL-------- +16== RPEAR-SSG-------------------NGDLQFLGWNVPPDQIQYIPEHWL-------- +17== RPEARMSSG-------------------SDELQFLGWNVPPDQIQYIPEHWL-------- +18== GPQMAYYGAASMDFG-------------YPEGVSIVDFVRPEIKPYVHQHWY-------- +19== GPQMAFYGSGAATFG-------------YPEGMTVADFVPDRVKHMVLDHWY-------- +20== GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN-------- +21== 
GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN-------- +22== GPQFAAPS-----------------------NGSVVDKVTPDMAHLISPYWD-------- +23== GPRFQAQSSG---------------------NGSVLDNVLPDMAHLVNPYWS-------- +24== GPRFEAQTGG---------------------NRSVLDNVLPDMAPLVNPHWS-------- +25== GPSYEAFSYG--GQA-------------RFNNQTVVDKVPPDMLHLIDANWY-------- +26== -ANQLSYSSL--GWP-------------YQPNASVVDTMPKEMLYMIHEHWY-------- +27== ----------LVNQT-------------WWYNPTV----------DIHPHWA-------- +28== ---------LRDNET-------------WWYNPSI----------VVHPHWR-------- +29== APHLLS-----------------------------------EVTASPAPTWDAPPDNASG +30== -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG +31=p -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG +32== TG--------------------------------------GNTTGI-------------- +33=p TG--------------------------------------GNVTSI-------------- +34== SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL------- +35=p SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL------- +36== EPNW-------------------------------------NVTVVPNTTWWQ------- + + +1== -----QY-YLAEPWKYSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAM +2== -----QY-YLAEPWQFSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAV +3== -----QY-YLAEPWKYRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAV +4=p -----QY-YLAEPWQFKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAV +5=p -----QY-YLAEPWQFKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAV +6== -----QD-HLGNQGIFMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSI +7== -----QY-HIAPVWAFYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSF +8=opsin, ------------------------------------------------------------ +9== -----NY-HIAPRWVYHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAV +10== -----NY-HIAPRWVYHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAV +11== -----NY-HIAPRWVYNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAF +12== -----NY-HIAPRWVYNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAV +13== -----QWPYQAPQSTYVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAV +14== 
-----TY-PEPPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAF +15== -----IY-PEPPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAF +16== -----TQ-LEPPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAV +17== -----TQ-LEPPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAV +18== -----NY-PPVNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLAL +19== -----NY-PPVNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLAL +20== -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI +21== -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI +22== -----QF-PAMDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI +23== -----RF-APMDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF +24== -----RF-APMDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF +25== -----QY-PPLNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAI +26== -----AF-PPMNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAF +27== -----KF-DPIPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAM +28== -----EF-DQVPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAF +29== CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLAL +30== CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL +31=p CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL +32== SDVTVSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV +33=p SDVTFSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV +34== TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV +35=p TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV +36== --ASAPFDTPAALVRAAAKAVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAV + + +1== ANLFMVLFG-FTVTMYTSMNG-YFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYI +2== ADLFMVFGG-FTTTLYTSLHG-YFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYV +3== ADLFMACFG-FTVTFYTAWNG-YFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYI +4=p AGTIMVCFG-FTVTFYTAING-YFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI +5=p AGAIMVCFG-FTVTFYTAING-YFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI +6== ANLFVAIFG-SPLSFYSFFNR-YFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWL +7== 
GGFLLCIFS-VFPVFVASCNG-YFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYI +8=opsin, -DLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL +9== ADLAETVIA-STISVVNQVYG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWM +10== ADLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL +11== VDLVETLVA-STISVFNQIFG-YFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWF +12== ADLGETVIA-STISVINQISG-YFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWF +13== ADLLVTLCG-SSVSLSNNING-FFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYV +14== CDFMMMVK--TPIFIYNSFHQ-GYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFN +15== CDFMMMIK--TPIFIYNSFHQ-GYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYN +16== FDLIMCLK--APIF--NSFHR-GFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN +17== FDLIMCLK--APIFIYNSFHR-GFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN +18== SDLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYN +19== SDLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYN +20== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ +21== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ +22== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ +23== SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYN +24== SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYN +25== SNFLMMFCM-SPPMVINCYYE-TWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYN +26== SDFCMMAFM-MPTMTSNCFAE-TWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYN +27== SDLSFSAINGFPLKTISAFMK-KWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYN +28== SDFTFSLVNGFPLMTISCFLK-KWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYN +29== ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL +30== ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL +31=p ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL +32== TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW +33=p TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW +34== ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW +35=p ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW +36== 
ADLLVACLV-MPLGAVYEVVQ-RWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYW + . : : * : : :*: + +1== VICKPMGNFR-FGNTHAIMGVAFTWIMALACA-APPLV-GWSRYIPEGMQCSCGPDYYTL +2== VVCKPMSNFR-FGENHAIMGVAFTWVMALACA-APPLV-GWSRYIPEGMQCSCGIDYYTL +3== VVCKPMGNFR-FSATHAMMGIAFTWVMAFSCA-APPLF-GWSRYMPEGMQCSCGPDYYTH +4=p VVCKPMGSFK-FSSSHAFAGIAFTWVMALACA-APPLF-GWSRYIPEGMQCSCGPDYYTL +5=p VVCKPMGSFK-FSSTHASAGIAFTWVMAMACA-APPLV-GWSRYIPEGIQCSCGPDYYTL +6== VICKPLGNFT-FKTPHAIAGCILPWISALAAS-LPPLF-GWSRYIPEGLQCSCGPDWYTT +7== VICKPFGNFR-FSSKHALTVVLATWTIGIGVS-IPPFF-GWSRFIPEGLQCSCGPDWYTV +8=opsin, VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG +9== VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG +10== VVCKPFGNVR-FDAKLAIVGIAFSWIWSAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG +11== VVCKPFGNIK-FDSKLAIIGIVFSWVWAWGWS-APPIF-GWSRYWPHGLKTSCGPDVFSG +12== VVCKPFGNIK-FDGKLAVAGILFSWLWSCAWT-APPIF-GWSRYWPHGLKTSCGPDVFSG +13== VVCKPLGDFQ-FQRRHAVSGCAFTWGWALLWS-APPLL-GWSSYVPEGLRTSCGPNWYTG +14== VITRPMEGK--MTHGKAIAMIIFIYMYATPWV-VACYTETWGRFVPEGYLTSCTFDYLTD +15== VITRPMEGK--MTHGKAIAMIIFIYLYATPWV-VACYTESWGRFVPEGYLTSCTFDYLTD +16== VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD +17== VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD +18== IICNGFNGPK-LTTGKAVVFALISWVIAIGCA-LPPFF-GWGNYILEGILDSCSYDYLTQ +19== IICNGFNGPK-LTQGKATFMCGLAWVISVGWS-LPPFF-GWGSYTLEGILDSCSYDYFTR +20== VIVKGMAGRP-MTIPLALGKM----------------------YVPEGNLTSCGIDYLER +21== VIVKGMAGRP-MTIPLALGKIAYIWFMSSIWC-LAPAF-GWSRYVPEGNLTSCGIDYLER +22== VIVKGMAGRP-MTIPLALGKIAYIWFMSTIWCCLAPVF-GWSRYVPEGNLTSCGIDYLER +23== VIVKGINGTP-MTIKTSIMKILFIWMMAVFWT-VMPLI-GWSAYVPEGNLTACSIDYMTR +24== VIVKGINGTP-MTIKTSIMKIAFIWMMAVFWT-IMPLI-GWSSYVPEGNLTACSIDYMTR +25== VIVKGLSGKP-LSINGALIRIIAIWLFSLGWT-IAPMF-GWNRYVPEGNMTACGTDYFNR +26== VIVRGMAAAP-LTHKKATLLLLFVWIWSGGWT-ILPFF-GWSRYVPEGNLTSCTVDYLTK +27== VIGRPMAASKKMSHRRAFLMIIFVWMWSIVWS-VGPVF-NWGAYVPEGILTSCSFDYLST +28== VIGRPMAASKKMSHRRAFIMIIFVWLWSVLWA-IGPIF-GWGAYTLEGVLCNCSFDYISR +29== 
GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ +30== GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ +31=p GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ +32== AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK +33=p AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK +34== AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ +35=p AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ +36== AVTN-IDYIHASTAKRVGMMIACVWTVSFFVC-IAQLL-GWKDPDWNQRVSEDLRCVVSQ + : : + +1== NPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTVKEAAAAQQE--------------- +2== KPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTVKEAAAQQQE--------------- +3== NPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKVREAAAQQQE--------------- +4=p NPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTVKAAAAQQQD--------------- +5=p NPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTVKAAAAQQQD--------------- +6== NNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITLKLAAKAQAD--------------- +7== GTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRALKAVAAQQQE--------------- +8=opsin, SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE--------------- +9== SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE--------------- +10== SSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAIRAVAKQQKE--------------- +11== SVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAIRAVAAQQKE--------------- +12== SSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAIRAVAAQQKE--------------- +13== GS--NNNSYILSLFVTCFVLPLSLILFSYTNLLLTLRAAAAQQKE--------------- +14== NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVESLRSNV- +15== NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVDSLRSNV- +16== NF--DTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKKMNVESLRSNV- +17== NF--DTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKKMNVESLRSNV- +18== DF--NTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKKMNVSTLRSN-- +19== DM--NTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKKMNVTNLRSN-- +20== DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS-- +21== DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS-- +22== 
DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS-- +23== MW--NPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKKMNVKSLRSS-- +24== QW--NPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKKMNVKSLRSS-- +25== GL--LSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKKMNVASLRSS-- +26== DW--SSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKKMNVASLRANA- +27== DP--STRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA-- +28== DS--TTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA-- +29== D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP-------------- +30== D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP-------------- +31=p D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP-------------- +32== D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVKKVEKTGADTRHGASP +33=p D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVRKVEKKGAGTSLGTSS +34== D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV +35=p D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV +36== D-----VGYQIFATASSFYVPVLIILILYWRIYQTARKRIRRRRGA-------TARGGVG + * : * : + +1== ------------------------------------------------------------ +2== ------------------------------------------------------------ +3== ------------------------------------------------------------ +4=p ------------------------------------------------------------ +5=p ------------------------------------------------------------ +6== ------------------------------------------------------------ +7== ------------------------------------------------------------ +8=opsin, ------------------------------------------------------------ +9== ------------------------------------------------------------ +10== ------------------------------------------------------------ +11== ------------------------------------------------------------ +12== ------------------------------------------------------------ +13== ------------------------------------------------------------ +14== ------------------------------------------------------------ +15== 
------------------------------------------------------------ +16== ------------------------------------------------------------ +17== ------------------------------------------------------------ +18== ------------------------------------------------------------ +19== ------------------------------------------------------------ +20== ------------------------------------------------------------ +21== ------------------------------------------------------------ +22== ------------------------------------------------------------ +23== ------------------------------------------------------------ +24== ------------------------------------------------------------ +25== ------------------------------------------------------------ +26== ------------------------------------------------------------ +27== ------------------------------------------------------------ +28== ------------------------------------------------------------ +29== GFPRVE--------------------------------PDSVI----------ALNGIVK +30== GFPRVQ--------------------------------PESVI----------SLNGVVK +31=p GFPRVQ--------------------------------PESVI----------SLNGVVK +32== A-PQPKKS-VNGESGSRNWRLGVESKAGGAL-----C-----------------ANGAVR +33=p A-PPPKKS-LNGQPGSGDWRRCAENRAVGTP-----C-----------------TNGAVR +34== ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV-- +35=p ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV-- +36== PPPVPAGGALVAGGGSGGIAAAVVAVIGR---------PLPTISET-------TTTGFTN + + +1== ------------------------------------------------------------ +2== ------------------------------------------------------------ +3== ------------------------------------------------------------ +4=p ------------------------------------------------------------ +5=p ------------------------------------------------------------ +6== ------------------------------------------------------------ +7== ------------------------------------------------------------ +8=opsin, 
------------------------------------------------------------ +9== ------------------------------------------------------------ +10== ------------------------------------------------------------ +11== ------------------------------------------------------------ +12== ------------------------------------------------------------ +13== ------------------------------------------------------------ +14== ------------------------------------------------------------ +15== ------------------------------------------------------------ +16== ------------------------------------------------------------ +17== ------------------------------------------------------------ +18== ------------------------------------------------------------ +19== ------------------------------------------------------------ +20== ------------------------------------------------------------ +21== ------------------------------------------------------------ +22== ------------------------------------------------------------ +23== ------------------------------------------------------------ +24== ------------------------------------------------------------ +25== ------------------------------------------------------------ +26== ------------------------------------------------------------ +27== ------------------------------------------------------------ +28== ------------------------------------------------------------ +29== -------------LQKEVEEC-AN------------------LSRLLKHER--------- +30== -------------LQKEVEEC-AN------------------LSRLLKHER--------- +31=p -------------LQKEVEEC-AN------------------LSRLLKHER--------- +32== QGDDGAALEV-----IEVHRV-GNSKEHLPLPSEAGP--TPCAPASFERKNERN------ +33=p QGDDEATLEV-----IEVHRV-GNSKEHLPLPSESGS--NSYAPACLERKNERN------ +34== -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN +35=p -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN +36== VSSNNTSP--------EKQSC-ANGLEADPPTTGYGAVAAAYYPSLVRRKP--------- + + +1== 
--------SASTQKAEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT--HQGSDFGAT-FM +2== --------SATTQKAEKEVTRMVIIMVIFFLICWLPYASVAMYIFT--HQGSNFGPI-FM +3== --------SATTQKAEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT--NKGADFTAT-LM +4=p --------SASTQKAEREVTKMVILMVFGFLIAWTPYATVAAWIFF--NKGADFSAK-FM +5=p --------SASTQKAEREVTKMVILMVLGFLVAWTPYATVAAWIFF--NKGAAFSAQ-FM +6== --------SASTQKAEREVTKMVVVMVLGFLVCWAPYASFSLWIVS--HRGEEFDLR-MA +7== --------SATTQKAEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN--NRNHGLDLR-LV +8=opsin, --------SESTQKAEKEVTRMVVVMVLAFC----------------------------- +9== --------SESTQKAEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA--NPGYPFHPL-MA +10== --------SESTQKAEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA--NPGYAFHPL-MA +11== --------SESTQKAEREVSRMVVVMIVAFCICWGPYASFVSFAAA--NPGYAFHPL-AA +12== --------SESTQKAEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA--NPGYAFHPL-AA +13== --------ADTTQRAEREVTRMVIVMVMAFLLCWLPYSTFALVVAT--HKGIIIQPV-LA +14== --------DKNKETAEIRIAKAAITICFLFFCSWTPYGVMSLIGAF--GDKTLLTPG-AT +15== --------DKSKEAAEIRIAKAAITICFLFFASWTPYGVMSLIGAF--GDKTLLTPG-AT +16== --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTQG-AT +17== --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTPG-AT +18== --------EADAQRAEIRIAKTALVNVSLWFICWTPYALISLKGVM--GDTSGITPL-VS +19== --------EAETQRAEIRIAKTALVNVSLWFICWTPYAAITIQGLL--GNAEGITPL-LT +20== --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT +21== --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT +22== --------EDADKSAEGKLAKVALVTISLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT +23== --------EDCDKSAEGKLAKVALTTISLWFMAWTPYLVICYFGLF--KI-DGLTPL-TT +24== --------EDCDKSAENKLAKVALTTISLWFMAWTPYLIICYFGLF--KI-DGLTPL-TT +25== --------ENQNTSAECKLAKVALMTISLWFMAWTPYLVINFSGIF--NL-VKISPL-FT +26== --------DQQKQSAECRLAKVAMMTVGLWFMAWTPYLIISWAGVF--SSGTRLTPL-AT +27== --------Q-AGASAEMKLAKISMVIITQFMLSWSPYAIIALLAQF--GPAEWVTPY-AA +28== --------Q-AGANAEMRLAKISIVIVSQFLLSWSPYAVVALLAQF--GPLEWVTPY-AA +29== -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE +30== 
-------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE +31=p -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE +32== ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPTL-LG +33=p ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPAL-LG +34== DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR +35=p DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR +36== -------KEAADSKRERKAAKTLAIITGAFVACWLPFFVLAILVPT-CD--CEVSPV-LT + * . : + +1== TLPAFFAKSSALYNPVIYILMNKQFRNCMITTL-----CC-----GKNPLGDDE-SGA-S +2== TLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSL-----CC-----GKNPLGDDE-ASA-T +3== AVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTI-----CC-----GKNPFGDEDVSSTVS +4=p AIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTI-----FC-----GKNPLGDDE-SSTVS +5=p AIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTL-----FC-----GKNPLGDEE-SSTVS +6== TIPSCLSKASTVYNPVIYVLMNKQFRSCMMK-M-----VC-----GKN-IEEDE-AST-S +7== TIPSFFSKSACIYNPIIYCFMNKQFQACIMK-M-----VC-----GKA-MTDES-DTC-S +8=opsin, ------------------------------------------------------------ +9== ALPAFFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S +10== ALPAYFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S +11== ALPAYFAKSATIYNPVIYVFMNRQFRNCIMQ-L-----F------GKK-VDDGS-EAS-T +12== ALPAYFAKSATIYNPIIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-EVS-T +13== SLPSYFSKTATVYNPIIYVFMNKQFQSCLLEML-----CC-----GYQPQRTGKASPGTP +14== MIPACACKMVACIDPFVYAISHPRYRMELQKRCPW---LALN---EK----APE-SSA-V +15== MIPACTCKMVACIDPFVYAISHPRYRMELQKRCPW---LAIS---EK----APE-SRA-A +16== MIPACTCKLVACIDPFVYAISHPRYRLELQKRCPW---LGVN---EK----SGE-ISS-A +17== MIPACTCKLVACIEPFVYAISHPRYRMELQKRCPW---LGVN---EK----SGE-ASS-A +18== TLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPW---FCVH---ET----ETK-SND-D +19== TLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPW---FCVH---EK----DPN-DVE-E +20== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A +21== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A +22== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSE-A +23== 
IWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCP----MCVF---GNT--DEPK-PDA-P +24== IWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCP----MCVC---GTT--DEPK-PDA-P +25== IWGSLFAKANAVYNPIVYGISHPKYRAALFAKFP----SLAC---AA----EPS-SDA-V +26== IWGSVFAKANSCYNPIVYGISHPRYKAALYQRFP----SLAC---GS---GESG-SDV-K +27== ELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQF---DEK--ECED-AND-A +28== QLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQF---DDK--ETED-DKD-A +29== RTFLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM +30== RTCLWLGYANSLINPFIYAFFNRDLRPTSRSLL-----QCQYRNINRKL------SAAGM +31=p RTCLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM +32== AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRQ------------ +33=p AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRR------------ +34== SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------ +35=p SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------ +36== SLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLL------CGRRVRRRR------------ + + +1== TSKTEVSSVSTS------------------------------------------------ +2== ASKTETSQVA-------------------------------------------------- +3== QSKTEVSSVSSS------------------------------------------------ +4=p TSKTEVSSVS-------------------------------------------------- +5=p TSKTEVSSVS-------------------------------------------------- +6== SQVTQVSSVA-------------------------------------------------- +7== SQKTEVSTVSST------------------------------------------------ +8=opsin, ------------------------------------------------------------ +9== ASKTEVSSVS-------------------------------------------------- +10== ASKTEVSSVS-------------------------------------------------- +11== TSRTEVSSVSNS------------------------------------------------ +12== -SRTEVSSVSNS------------------------------------------------ +13== GPHADVTAAGLR------------------------------------------------ +14== ASTS-TTQEPQ------------------------------------------------- +15== ISTS-TTQEQQ------------------------------------------------- +16== 
QSTT-TQEQ-Q------------------------------------------------- +17== QSTT-TQEQTQ------------------------------------------------- +18== SQSNSTVAQDK------------------------------------------------- +19== NQSSNTQTQEK------------------------------------------------- +20== QSQA-TASEAE------------------------------------------------- +21== QSQA-TASEAE------------------------------------------------- +22== QSQA-TTSEAE------------------------------------------------- +23== ASDTETTSEAD------------------------------------------------- +24== PSDTETTSEAE------------------------------------------------- +25== STTSGTTTVTDN------------------------------------------------ +26== SEASATTTMEEK------------------------------------------------ +27== EEEV-VASERG--GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PPQGYPPQGA +28== ETEI-PAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPPQGYPPQG- +29== HEALKLAERPERP-----------------EFVLQNA----------------------- +30== HEALKLAERPERS-----------------EFVLQNS----------------------- +31=p HEALKLAERPERS-----------------EFVLQNS----------------------- +32== ------------------------------------------------------------ +33=p ------------------------------------------------------------ +34== ------------------------------------------------------------ +35=p ------------------------------------------------------------ +36== ------------------------------------------------------------ + + +1== --------------------------------------------PVSP-A--- +2== -----------------------------------------------P-A--- +3== --------------------------------------------QVSP-A--- +4=p -----------------------------------------------P-A--- +5=p -----------------------------------------------P-A--- +6== -----------------------------------------------PEK--- +7== --------------------------------------------QVGP-N--- +8=opsin, ----------------------------------------------------- +9== --------------------------------------------SVSP-A--- +10== 
--------------------------------------------SVSP-A--- +11== --------------------------------------------SVAP-A--- +12== --------------------------------------------SVSP-A--- +13== -------------------------------------------NKVMP-AHPV +14== --------------------------------------------QTTA-A--- +15== --------------------------------------------QTTA-A--- +16== --------------------------------------------QTTA-A--- +17== --------------------------------------------QTSA-A--- +18== -------------------------------------------------A--- +19== -------------------------------------------------S--- +20== ----------------------------------------------SK-A--- +21== ----------------------------------------------SK-A--- +22== ----------------------------------------------SK-A--- +23== ----------------------------------------------SK-A--- +24== ----------------------------------------------SK-D--- +25== -------------------------------------------EK-SN-A--- +26== -------------------------------------------PKIPE-A--- +27== YPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQ-A--- +28== YPP-QGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQ-A--- +29== -------------------------------------------DYCRKKGHDS +30== -------------------------------------------DHCGKKGHDT +31=p -------------------------------------------DHCGKKGHDT +32== ----------------------------------------------------- +33=p ----------------------------------------------------- +34== ----------------------------------------------------- +35=p ----------------------------------------------------- +36== -------------------------------------------------A-PQ +
--- a/test-data/mafft_fftns_result.aln Sat Nov 11 15:06:34 2017 -0500 +++ b/test-data/mafft_fftns_result.aln Wed Apr 15 15:33:37 2020 -0400 @@ -1,504 +1,468 @@ > 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91] ---------------------------------MNGTE--------------GDNF----- --------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK--- ---------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA -NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV -ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD -YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE-------------- -------------------------------------------------------AAAAQQ +----------------------------------------MNG----------------T +E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL +AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM +N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM +GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF +VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ-------------------------- ------------------------------------------------------------ ---------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA -FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------ ---GKNPLGDDE--SGASTSKTEVSSVS-TSPVS--------------------------- ------------------------------------PA----------------------- --- +------------------------------------------------------------ +-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H +QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL +GDDE--SGASTSKTEVSSVS-TSPVSPA-------------------------------- +--------------------------------------------------------- > 2== U22180 1 rat opsin <rod>[J.Mol.Neurosci.5(3),207-209'94] ---------------------------------MNGTE--------------GPNF----- --------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ--- ---------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA -DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV 
-VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID -YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE-------------- -------------------------------------------------------AAAQQQ +----------------------------------------MNG----------------T +E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML +AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL +H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM +GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF +VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ-------------------------- ------------------------------------------------------------ ---------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA -MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------ ---GKNPLGDDE--ASATASKTE------TSQVA--------------------------- ------------------------------------PA----------------------- --- +------------------------------------------------------------ +-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H +QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL +GDDE--ASATASKTE------TSQVAPA-------------------------------- +--------------------------------------------------------- > 3== M92038 1 chicken green sensitive cone opsin <retina>[PNAS89,5932-5936'9 ---------------------------------MNGTE--------------GINF----- --------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK--- ---------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA -DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV -VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD -YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE-------------- -------------------------------------------------------AAAQQQ +----------------------------------------MNG----------------T +E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV +CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW +N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM +GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF 
+VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ-------------------------- ------------------------------------------------------------ ---------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA -FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------ ---GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS--------------------------- ------------------------------------PA----------------------- --- +------------------------------------------------------------ +-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N +KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF +GDEDVSSTVSQSKTEVSSVS-SSQVSPA-------------------------------- +--------------------------------------------------------- > 4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish ---------------------------------MNGTE--------------GKNF----- --------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ--- ---------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA -GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV -VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD -YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA-------------- -------------------------------------------------------AAAQQQ +----------------------------------------MNG----------------T +E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL +ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI +N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA +GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF +VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ-------------------------- ------------------------------------------------------------ ---------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA -AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------ ---GKNPLGDDE-SSTVSTSKTEVSS------VS--------------------------- ------------------------------------PA----------------------- --- +------------------------------------------------------------ +-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N 
+KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL +GDDE-SSTVSTSKTEVSS------VSPA-------------------------------- +--------------------------------------------------------- > 5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish ---------------------------------MNGTE--------------GNNF----- --------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ--- ---------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA -GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV -VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD -YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA-------------- -------------------------------------------------------AAAQQQ +----------------------------------------MNG----------------T +E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL +AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI +N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA +GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF +ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ-------------------------- ------------------------------------------------------------ ---------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA -AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------ ---GKNPLGDEE-SSTVSTSKTEVSS------VS--------------------------- ------------------------------------PA----------------------- --- +------------------------------------------------------------ +-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N +KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL +GDEE-SSTVSTSKTEVSS------VSPA-------------------------------- +--------------------------------------------------------- > 6== L11864 1 Carassius auratus blue cone opsin <retina>[Biochemistry32,208- ---------------------------------MKQVPEF------------HEDF----- --------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI--- ---------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA -NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV 
-ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD -WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL-------------- -------------------------------------------------------AAKAQA +----------------------------------------MKQ----------------V +PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM +SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF +N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA +GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF +CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA-------------------------- ------------------------------------------------------------ ---------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS -LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------ ---GKN-IEEDE--ASTSSQVTQVSS------VA--------------------------- ------------------------------------PEK---------------------- --- +------------------------------------------------------------ +-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H +RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I +EEDE--ASTSSQVTQVSS------VAPEK------------------------------- +--------------------------------------------------------- > 7== M13299 1 human BCP <>[Science232(4747),193-202'86] ---------------------------------MRKMS--------------EEEF----- --------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA--- ---------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG -GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV -ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD -WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA-------------- -------------------------------------------------------VAAQQQ +----------------------------------------MRK----------------M +S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ +AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC +N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT +VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF 
+IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ-------------------------- ------------------------------------------------------------ ---------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA -MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------ ---GKA-MTDES--DTCSSQKTEVSTVS-STQVG--------------------------- ------------------------------------PN----------------------- --- +------------------------------------------------------------ +-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N +RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M +TDES--DTCSSQKTEVSTVS-STQVGPN-------------------------------- +--------------------------------------------------------- > 8=opsin, greensensitive human (fragment) S07060 ------------------------------------------------------------ ------------------------------------------------------------ +------------------------------------------DLAETVIA-STISIVNQV +S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- ------------------------------------------------------------ -DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV -VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD -VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA-------------- -------------------------------------------------------VAKQQK +------------------------------------------------------------ +-------------ESESTQK------AEKEVTRMVVVMVLAFC----------------- +------------------------------------------------------------ +------------------------------------------------------------ +--------------------------------------------------------- +> 9== K03494 1 human GCP <>[Science232(4747),193-202'86] +----------------------------------------MAQQWSLQRLAGRHPQDSYE +DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV 
+Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV +GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N +PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +--------------------------------------------------------- +> 10== Z68193 1 human Red Opsin <>[] +----------------------------------------MAQQWSLQRLAGRHPQDSYE +DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV +S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK-------------------------- +------------------------------------------------------------ ------------------------------------------------------------ ---------------------ESESTQK------AEKEVTRMVVVMVLAFC---------- +-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N +PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +--------------------------------------------------------- +> 11== M92036 1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92] +----------------------------------------MTEAWNVAVFAARRSRDD-D +DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV +SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI +F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII +GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM +ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK-------------------------- +------------------------------------------------------------ ------------------------------------------------------------ 
+-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N +PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V +DDGS--EASTTSRTEVSSVS-NSSVAPA-------------------------------- +--------------------------------------------------------- +> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90] +----------------------------------------MAA-WEAAFAARRRHEE--E +DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT +SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI +S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA +GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM +VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK-------------------------- +------------------------------------------------------------ +------------------------------------------------------------ +-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N +PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V +DDGS--EVST-SRTEVSSVS-NSSVSPA-------------------------------- +--------------------------------------------------------- +> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95] +----------------------------------------MS-----------------S +NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV +AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI +N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS +GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF +VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK-------------------------- ------------------------------------------------------------ ------------------------------------------------------------ --- -> 9== K03494 1 human GCP <>[Science232(4747),193-202'86] ---------------------------------MAQQWSLQRLAGRHPQDSYEDST----- --------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV--- ---------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA -DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV -VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD 
-VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA-------------- -------------------------------------------------------VAKQQK ------------------------------------------------------------- ---------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA -CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF------- ---GKK-VDDGS--ELSSASKTEVSSV---SSVS--------------------------- ------------------------------------PA----------------------- --- -> 10== Z68193 1 human Red Opsin <>[] ---------------------------------MAQQWSLQRLAGRHPQDSYEDST----- --------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV--- ---------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA -DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV -VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD -VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA-------------- -------------------------------------------------------VAKQQK ------------------------------------------------------------- ---------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA -CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF------- ---GKK-VDDGS--ELSSASKTEVSSV---SSVS--------------------------- ------------------------------------PA----------------------- --- -> 11== M92036 1 Gecko gecko P521 <retina>[PNAS89,6841-6845'92] ---------------------------------MTEAWNVAVFAARRSRDD-DDTT----- --------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV--- ---------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV -DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV -VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD -VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA-------------- -------------------------------------------------------VAAQQK ------------------------------------------------------------- ---------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV -SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF------- ---GKK-VDDGS--EASTTSRTEVSSVS-NSSVA--------------------------- 
------------------------------------PA----------------------- --- -> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90] ---------------------------------MAA-WEAAFAARRRHEE--EDTT----- --------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV--- ---------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA -DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV -VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD -VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA-------------- -------------------------------------------------------VAAQQK ------------------------------------------------------------- ---------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA -CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF------- ---GKK-VDDGS--EVST-SRTEVSSVS-NSSVS--------------------------- ------------------------------------PA----------------------- --- -> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95] ---------------------------------MS-----------------SNSS----- --------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST--- ---------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA -DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV -VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN -WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA-------------- -------------------------------------------------------AAAQQK ------------------------------------------------------------- ---------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA -LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY--- --QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM--------------------------- ------------------------------------PAHPV-------------------- --- +-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H +KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T +GKAS--PGTPGPHADVTAAGLRNKVMPAHPV----------------------------- +--------------------------------------------------------- > 14== M17718 1 D.melanogaster Rh3 
<>[J.Neurosci.7,1550-1557'87] -----------MES--GNV-----------SSSLFGNVSTAL----------RPEA----- --------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP -E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC -DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV -ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD -YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA-------------- -------------------------------------------------------LRDQAK -KMN---------------VESLRS------------------------------------ --------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS -LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL--- ----NE-KAPES----SAVASTSTTQEPQQTTAA--------------------------- ------------------------------------------------------------- --- +----------MESGNVSS------------SLFGNVST-ALRP----------------E +ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL +GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF +H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA +MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- +--------------------------------------------------MN-------- +--VESL------------------------------------------------------ +----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G +DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N +EKAP--ESSAVASTSTTQEP--QQTTAA-------------------------------- +--------------------------------------------------------- > 15== X65879 1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92 -----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA----- --------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP -E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC -DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV -ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD -YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA-------------- 
-------------------------------------------------------LRDQAK -KMN---------------VDSLRS------------------------------------ --------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS -LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI--- ----SE-KAPES----RAAISTSTTQEQQQTTAA--------------------------- ------------------------------------------------------------- --- +----------MEYHNVSS------------VL-GNVSS-VLRP----------------D +ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL +GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF +H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA +MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- +--------------------------------------------------MN-------- +--VDSL------------------------------------------------------ +----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G +DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S +EKAP--ESRAAISTSTTQEQ--QQTTAA-------------------------------- +--------------------------------------------------------- > 16== M17730 1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87] -----------ME-------------------PLCNASEPPL----------RPEA----- --------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL -E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF -DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV -ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD -YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA-------------- -------------------------------------------------------LREQAK -KMN---------------VESLRS------------------------------------ --------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS -LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV--- ----NE-KSGEI----SSAQSTTTQEQ-QQTTAA--------------------------- ------------------------------------------------------------- --- +----------ME------------------PL-CNASEPPLRP----------------E 
+AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF +H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK------------------------- +--------------------------------------------------MN-------- +--VESL------------------------------------------------------ +----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N +EKSG--EISSAQST-TTQEQ--QQTTAA-------------------------------- +--------------------------------------------------------- > 17== X65880 1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92 -----------MD-------------------ALCNASEPPL----------RPEA----- --------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL -E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF -DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV -ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD -YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA-------------- -------------------------------------------------------LREQAK -KMN---------------VESLRS------------------------------------ --------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS -LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV--- ----NE-KSGEA----SSAQSTTTQEQTQQTSAA--------------------------- ------------------------------------------------------------- --- +----------MD------------------AL-CNASEPPLRP----------------E +ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF +H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK------------------------- +--------------------------------------------------MN-------- 
+--VESL------------------------------------------------------ +----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N +EKSG--EASSAQST-TTQEQ-TQQTSAA-------------------------------- +--------------------------------------------------------- > 18== D50584 1 Hemigrapsus sanguineus opsin BcRh2 <compound eye>[J.Exp.Biol.1 ---------------------------------MTNATGPQM----------AYYG----- --------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP -P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS -DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI -ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD -YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA-------------- -------------------------------------------------------MRAQAK -KMN---------------VSTLRS------------------------------------ ---------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS -LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV--- ----HE-TETKS-NDDSQSNSTVAQDKA--------------------------------- ------------------------------------------------------------- --- +--------------------------------MTNATGPQMAY----------------Y +GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL +GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF +SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV +FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF +VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +--------------------------------------------------MN-------- +--VSTL------------------------------------------------------ +----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G +DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T +ETKS--NDDSQSNSTVAQDK-A-------------------------------------- +--------------------------------------------------------- > 19== D50583 1 Hemigrapsus sanguineus opsin BcRh1 <compound eye>[J.Exp.Biol.1 
---------------------------------MANVTGPQM----------AFYG----- --------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP -P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS -DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI -ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD -YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA-------------- -------------------------------------------------------MRAQAK -KMN---------------VTNLRS------------------------------------ ---------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT -IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV--- ----HE-KDPND-VEENQSSNTQTQEKS--------------------------------- ------------------------------------------------------------- --- +--------------------------------MANVTGPQMAF----------------Y +GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL +GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF +SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF +MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF +IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +--------------------------------------------------MN-------- +--VTNL------------------------------------------------------ +----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G +NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K +DPND--VEENQSSNTQTQEK-S-------------------------------------- +--------------------------------------------------------- > 20== K02320 1 D.melanogaster opsin <>[Cell40,851-858'85] ----------------MES-----------FAVAAAQLGPHF----------APLS----- -------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP -A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID -YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -------------------------------------------------------MREQAK 
-KMN---------------VKSLRS------------------------------------ ---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN -CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- ----GK-VDDGK-SSDAQSQATASEAESKA------------------------------- ------------------------------------------------------------- --- +----------ME----SF------------AVAAAQLGPHFAP----------------L +S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL +TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +--------------------------------------------------------- > 21== K02315 1 D.melanogaster ninaE <>[Cell40,839-850'85] ----------------MES-----------FAVAAAQLGPHF----------APLS----- -------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP -A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID -YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -------------------------------------------------------MREQAK -KMN---------------VKSLRS------------------------------------ ---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN -CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- ----GK-VDDGK-SSDAQSQATASEAESKA------------------------------- ------------------------------------------------------------- --- +----------ME----SF------------AVAAAQLGPHFAP----------------L +S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL 
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +--------------------------------------------------------- > 22== X65877 1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204' ----------------MDS-----------FAAVATQLGPQF----------AAPS----- -------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP -A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID -YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -------------------------------------------------------MREQAK -KMN---------------VKSLRS------------------------------------ ---------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN -CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- ----GK-VDDGK-SSEAQSQATTSEAESKA------------------------------- ------------------------------------------------------------- --- +----------MD----SF------------AAVATQLGPQFAA----------------P +S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL +TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ 
+----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K +F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +DDGK--SSEAQSQA-TTSEA-ESKA----------------------------------- +--------------------------------------------------------- > 23== M12896 1 D.melanogaster Rh2 <>[Cell44,705-710'86] -----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS----- --------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA -P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS -DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV -IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID -YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA-------------- -------------------------------------------------------MREQAK -KMN---------------VKSLRS------------------------------------ ---------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC -YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF--- ----GN-TDEPKPDAPASDTETTSEADSKA------------------------------- ------------------------------------------------------------- --- +-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q +SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL +GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS +LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K +I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T +DEPK--PDAPASDTETTSEA-DSKA----------------------------------- +--------------------------------------------------------- > 24== X65878 1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92 -----------MERSLLPE-----------PPLAMALLGPRF----------EAQT----- --------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA 
-P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS -DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV -IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID -YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA-------------- -------------------------------------------------------MRDQAK -KMN---------------VKSLRS------------------------------------ ---------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC -YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC--- ----GT-TDEPKPDAPPSDTETTSEAESKD------------------------------- ------------------------------------------------------------- --- +-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q +TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL +GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS +LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK------------------------- +--------------------------------------------------MN-------- +--VKSL------------------------------------------------------ +----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K +I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T +DEPK--PDAPPSDTETTSEA-ESKD----------------------------------- +--------------------------------------------------------- > 25== U26026 1 Apis mellifera long-wavelength rhodopsin <>[] ---------------------------------MIAVSGPSY----------EAFS----- --------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP -P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS -NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV -IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD -YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN-------------- -------------------------------------------------------MREQAK -KMN---------------VASLRS------------------------------------ ---------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN 
-FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC--- -----A-AEPSS-DAVSTTSGTTTVTDNEKSNA---------------------------- ------------------------------------------------------------- --- +--------------------------------MIAVSGPSYEA----------------F +SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL +GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY +Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI +RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG +IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK------------------------- +--------------------------------------------------MN-------- +--VASL------------------------------------------------------ +----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N +L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A +EPSS--DAVSTTSGTTTVTD-NEKSNA--------------------------------- +--------------------------------------------------------- > 26== L03781 1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93] -----------------------------------MANQLSY----------SSLG----- --------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP -P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS -DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV -IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD -YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ-------------- -------------------------------------------------------LREQAK -KMN---------------VASLRA------------------------------------ --------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS -WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC--- ----GS-GESGS-DVKSEASATTTMEEKPKIPEA--------------------------- ------------------------------------------------------------- --- +----------------------------------MANQLSYSS----------------L +GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL +GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF +A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL 
+LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG +LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK------------------------- +--------------------------------------------------MN-------- +--VASL------------------------------------------------------ +----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S +SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G +ESGS--DVKSEASATTTMEE-KPKIPEA-------------------------------- +--------------------------------------------------------- > 27== X07797 1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88] ----------------------------------------MV----------ESTT----- --------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD -P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS -DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV -IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD -YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE-------------- -------------------------------------------------------MAAMAK -RLN---------------AKELR------------------------------------- ---------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA -LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ -FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG -Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY -QA +---------------------------------------MVES----------------T +TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV +GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF +M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL +MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY +FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR------------------------- +--------------------------------------------------LN-------- +--AKEL------------------------------------------------------ +----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G +PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C +EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP 
+QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA > 28== X70498 1 Todarodes pacificus rhodopsin <retina>[FEBS317(1-2),5-11'93] -----------------------------------------M----------GRDL----- --------------RDNET-WWY--NPSI----------V------------VHPHWREFD -Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS -DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV -IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD -YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE-------------- -------------------------------------------------------MAAMAK -RLN---------------AKELR------------------------------------- ---------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA -LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ -FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG -YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY -QA +----------------------------------------MGR----------------D +LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL +GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF +L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI +MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF +ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR------------------------- +--------------------------------------------------LN-------- +--AKEL------------------------------------------------------ +----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G +PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T +EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP +QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA > 29== L21195 1 human serotonin 5-HT7 receptor protein <placenta and fetal bra ----------MMDVNSSGRPDLYGHLRSF-LLPEVGRGLPDL----------SPDGGADPV -AGSWAPHLLS---EVTAS-----PAPTW------------DAPPDNAS--GCGEQIN--- ----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALA -DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG 
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- ---------------------------------------------P----GFPRVEPDSVI -ALNG--------------IVKLQ----------------------KEVEECANLSR---- ---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -TARPFICGTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------ ----QY-RNINR--KLSAAGMHEALKLAER------------------------------- ------------------------------------PERPEFVL-QNADYCRKKGHDS--- --- +---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D +PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----EPDSVIALNG------- +--IVKL----------------------QK---------EVEECAN-------------- +----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERPEF------------VLQNADY------------- +--------------------------------------------CRKKGHDS----- > 30== L15228 1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93] ------------------------------------------------------------ -----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN--- ----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA -DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG -ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- ---------------------------------------------P----GFPRVQPESVI -SLNG--------------VVKLQ----------------------KEVEECANLSR---- ---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------ ----QY-RNINR--KLSAAGMHEALKLAER------------------------------- 
------------------------------------PERSEFVL-QNSDHCGKKGHDT--- --- +------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----QPESVISLNG------- +--VVKL----------------------QK---------EVEECAN-------------- +----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- +--------------------------------------------CGKKGHDT----- > 31=p A47425 serotonin receptor 5HT-7 - rat ------------------------------------------------------------ -----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN--- ----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA -DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG -ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- ---------------------------------------------P----GFPRVQPESVI -SLNG--------------VVKLQ----------------------KEVEECANLSR---- ---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------ ----QY-RNINR--KLSAAGMHEALKLAER------------------------------- ------------------------------------PERSEFVL-QNSDHCGKKGHDT--- --- +------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +---------------------------------PGFPRV----QPESVISLNG------- +--VVKL----------------------QK---------EVEECAN-------------- 
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- +--------------------------------------------CGKKGHDT----- > 32== M83181 1 human serotonin receptor <>[JBC267(11),7553-7562'92] -----------MDVLSPG------------QGNNTTSPPAPF----------ETGG----- --------------NTTGI-----SDVTV-------------------------------- -------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT -DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA -ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD -H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK-------------- --------------------------TVKKVEKTGADTRHGASPAP---------QPKKS- --VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL -PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA -LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------ ----KF-CRQ--------------------------------------------------- +----------MDVLSP-------------------------------------------- +---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT +SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- +--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR-- +-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG-- +PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ---- ------------------------------------------------------------ --- +--------------------------------------------------------- > 33=p A35181 serotonin receptor class 1A - rat -----------MDVFSFG------------QGNNTTASQEPF----------GTGG----- --------------NVTSI-----SDVTF-------------------------------- -------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT 
-DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA -ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD -H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK-------------- --------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS- --LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL -PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA -LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------ ----KF-CRR--------------------------------------------------- +----------MDVFSF-------------------------------------------- +---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT +SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- +--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG-- +-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG-- +SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR---- ------------------------------------------------------------ --- +--------------------------------------------------------- > 34== L06803 1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93] -MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG----- --------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT -DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA -DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA -VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD -K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE -TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN -GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN -DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA -LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------ ----KY-RRGHR------------------------------------------------- 
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- +-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- ------------------------------------------------------------ --- +--------------------------------------------------------- > 35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail -MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG----- --------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT -DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA -DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA -VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD -K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE -TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN -GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN -DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA -LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------ ----KY-RRGHR------------------------------------------------- +MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- 
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- ------------------------------------------------------------ --- +--------------------------------------------------------- > 36== X95604 1 Bombyx mori serotonin receptor <antennae>[InsectBiochem.Mol.Bi --MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW----- --------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK-- -------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA -DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA -VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD -V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR--------------- -------------------------------RRRGATARGGVGPPP---------VPAGGA -LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP -TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA -ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------ ----RR-VRRRR--A---------------------------------------------- ------------------------------------PQ----------------------- --- +-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T +VVPN--TTWW------------QASAPFDTPAALVRAAAK-------------------- +AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV +V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM +MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT +ASSFYVPVLIILILYWRIY-------QTARKRIR-------------------------- +-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA +AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV +AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C +DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR-- +------A---------------PQ------------------------------------ +---------------------------------------------------------
--- a/test-data/mafft_nwns_result.aln Sat Nov 11 15:06:34 2017 -0500 +++ b/test-data/mafft_nwns_result.aln Wed Apr 15 15:33:37 2020 -0400 @@ -1,270 +1,270 @@ -CLUSTAL format alignment by MAFFT NW-NS-2 (v7.221) +CLUSTAL format alignment by MAFFT NW-NS-2 (v7.455) -1== --------------------------------MNGTE--------------GDNF----- -2== --------------------------------MNGTE--------------GPNF----- -3== --------------------------------MNGTE--------------GINF----- -4=p --------------------------------MNGTE--------------GKNF----- -5=p --------------------------------MNGTE--------------GNNF----- -6== --------------------------------MKQVPEF------------HEDF----- -7== --------------------------------MRKMS--------------EEEF----- +1== ----------------------------------------MNG----------------T +2== ----------------------------------------MNG----------------T +3== ----------------------------------------MNG----------------T +4=p ----------------------------------------MNG----------------T +5=p ----------------------------------------MNG----------------T +6== ----------------------------------------MKQ----------------V +7== ----------------------------------------MRK----------------M 8=opsin, ------------------------------------------------------------ -9== --------------------------------MAQQWSLQRLAGRHPQDSYEDST----- -10== --------------------------------MAQQWSLQRLAGRHPQDSYEDST----- -11== --------------------------------MTEAWNVAVFAARRSRDD-DDTT----- -12== --------------------------------MAA-WEAAFAARRRHEE--EDTT----- -13== --------------------------------MS-----------------SNSS----- -14== ----------MES--GNV-----------SSSLFGNVSTAL----------RPEA----- -15== ----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA----- -16== ----------ME-------------------PLCNASEPPL----------RPEA----- -17== ----------MD-------------------ALCNASEPPL----------RPEA----- -18== --------------------------------MTNATGPQM----------AYYG----- -19== --------------------------------MANVTGPQM----------AFYG----- -20== 
---------------MES-----------FAVAAAQLGPHF----------APLS----- -21== ---------------MES-----------FAVAAAQLGPHF----------APLS----- -22== ---------------MDS-----------FAAVATQLGPQF----------AAPS----- -23== ----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS----- -24== ----------MERSLLPE-----------PPLAMALLGPRF----------EAQT----- -25== --------------------------------MIAVSGPSY----------EAFS----- -26== ----------------------------------MANQLSY----------SSLG----- -27== ---------------------------------------MV----------ESTT----- -28== ----------------------------------------M----------GRDL----- -29== ---------MMDVNSSGRPDLYGHLRSF-LLPEVGRGLPDL----------SPDGGADPV +9== ----------------------------------------MAQQWSLQRLAGRHPQDSYE +10== ----------------------------------------MAQQWSLQRLAGRHPQDSYE +11== ----------------------------------------MTEAWNVAVFAARRSRDD-D +12== ----------------------------------------MAA-WEAAFAARRRHEE--E +13== ----------------------------------------MS-----------------S +14== ----------MESGNVSS------------SLFGNVST-ALRP----------------E +15== ----------MEYHNVSS------------VL-GNVSS-VLRP----------------D +16== ----------ME------------------PL-CNASEPPLRP----------------E +17== ----------MD------------------AL-CNASEPPLRP----------------E +18== --------------------------------MTNATGPQMAY----------------Y +19== --------------------------------MANVTGPQMAF----------------Y +20== ----------ME----SF------------AVAAAQLGPHFAP----------------L +21== ----------ME----SF------------AVAAAQLGPHFAP----------------L +22== ----------MD----SF------------AAVATQLGPQFAA----------------P +23== -----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q +24== -----MERSLLP----EP------------PLAMALLGPRFEA----------------Q +25== --------------------------------MIAVSGPSYEA----------------F +26== ----------------------------------MANQLSYSS----------------L +27== ---------------------------------------MVES----------------T +28== 
----------------------------------------MGR----------------D +29== ---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D 30== ------------------------------------------------------------ 31=p ------------------------------------------------------------ -32== ----------MDVLSPG------------QGNNTTSPPAPF----------ETGG----- -33=p ----------MDVFSFG------------QGNNTTASQEPF----------GTGG----- -34== MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG----- -35=p MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG----- -36== -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW----- +32== ----------MDVLSP-------------------------------------------- +33=p ----------MDVFSF-------------------------------------------- +34== MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +35=p MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T +36== -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T -1== -------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK--- -2== -------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ--- -3== -------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK--- -4=p -------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ--- -5=p -------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ--- -6== -------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI--- -7== -------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA--- +1== E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL +2== E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML +3== E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV +4=p E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL +5=p E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL +6== PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM +7== S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ 8=opsin, ------------------------------------------------------------ -9== -------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV--- -10== 
-------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV--- -11== -------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV--- -12== -------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV--- -13== -------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST--- -14== -------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP -15== -------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP -16== -------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL -17== -------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL -18== -------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP -19== -------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP -20== ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP -21== ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP -22== ------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP -23== -------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA -24== -------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA -25== -------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP -26== -------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP -27== -------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD -28== -------------RDNET-WWY--NPSI----------V------------VHPHWREFD -29== AGSWAPHLLS---EVTAS-----PAPTW------------DAPPDNAS--GCGEQIN--- -30== ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN--- -31=p ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN--- -32== -------------NTTGI-----SDVTV-------------------------------- -33=p -------------NVTSI-----SDVTF-------------------------------- -34== -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT -35=p -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT -36== -------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK-- - - -1== --------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA -2== --------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA -3== 
--------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA -4=p --------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA -5=p --------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA -6== --------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA -7== --------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG -8=opsin, ------------------------------------------------------------ -9== --------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA -10== --------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA -11== --------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV -12== --------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA -13== --------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA -14== E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC -15== E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC -16== E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF -17== E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF -18== P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS -19== P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS -20== A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -21== A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -22== A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS -23== P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS -24== P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS -25== P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS -26== P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS -27== P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS -28== Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS -29== ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALA -30== ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA -31=p ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA -32== 
------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT -33=p ------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT -34== DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA -35=p DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA -36== ------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA +9== DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +10== DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT +11== DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV +12== DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT +13== NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV +14== ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL +15== ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL +16== AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +17== ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML +18== GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL +19== GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL +20== S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL +21== S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL +22== S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL +23== SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL +24== TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL +25== SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL +26== GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL +27== TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV +28== LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL +29== PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI +30== ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +31=p ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI +32== ---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT +33=p 
---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT +34== SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +35=p SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT +36== VVPN--TTWW------------QASAPFDTPAALVRAAAK-------------------- -1== NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV -2== DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV -3== DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV -4=p GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV -5=p GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV -6== NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV -7== GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV -8=opsin, DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV -9== DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV -10== DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV -11== DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV -12== DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV -13== DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV -14== DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV -15== DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV -16== DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV -17== DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV -18== DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI -19== DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI -20== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -21== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -22== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV -23== DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV -24== DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV -25== NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV -26== DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV 
-27== DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV -28== DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV -29== DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG -30== DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG -31=p DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG -32== DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA -33=p DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA -34== DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA -35=p DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA -36== DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA - . : : * : : :*: +1== AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM +2== AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL +3== CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW +4=p ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI +5=p AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI +6== SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF +7== AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC +8=opsin, ------------------------------------------DLAETVIA-STISIVNQV +9== SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV +10== SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV +11== SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI +12== SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI +13== AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI +14== GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF +15== GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF +16== GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF +17== GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF +18== GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF +19== GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF +20== 
TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +21== TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +22== TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY +23== GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +24== GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY +25== GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY +26== GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF +27== GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF +28== GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF +29== GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +30== GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +31=p GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL +32== SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +33=p SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV +34== SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +35=p SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI +36== AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV + . 
+ +1== N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM +2== H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM +3== N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM +4=p N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA +5=p N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA +6== N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA +7== N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT +8=opsin, S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +9== Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV +10== S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV +11== F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII +12== S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA +13== N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS +14== H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA +15== H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA +16== H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +17== H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI +18== SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV +19== SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF +20== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +21== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +22== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG +23== Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +24== Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM +25== Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI +26== A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL +27== M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL +28== L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI +29== IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +30== 
IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +31=p IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK +32== L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +33=p L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA +34== S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +35=p S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL +36== V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM + : : * : : :*: : : -1== ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD -2== VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID -3== VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD -4=p VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD -5=p VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD -6== ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD -7== ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD -8=opsin, VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD -9== VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD -10== VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD -11== VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD -12== VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD -13== VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN -14== ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD -15== ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD -16== ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD -17== ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD -18== ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD -19== ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD -20== IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID -21== IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID -22== IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID -23== 
IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID -24== IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID -25== IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD -26== IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD -27== IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD -28== IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD -29== ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -30== ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -31=p ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD -32== ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD -33=p ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD -34== VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD -35=p VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD -36== VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD - : : : +1== GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF +2== GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF +3== GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF +4=p GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF +5=p GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF +6== GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF +7== VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF +8=opsin, GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +9== GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +10== GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM +11== GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM +12== GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM +13== GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF +14== MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +15== MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF +16== 
MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +17== MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF +18== FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF +19== MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF +20== KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +21== KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +22== KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS +23== KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS +24== KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS +25== RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG +26== LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG +27== MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY +28== MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF +29== MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +30== MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +31=p MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST +32== LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +33=p LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST +34== MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +35=p MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST +36== MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT + : -1== YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE-------------- -2== YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE-------------- -3== YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE-------------- -4=p YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA-------------- -5=p YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA-------------- -6== WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL-------------- -7== WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA-------------- -8=opsin, VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA-------------- -9== 
VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA-------------- -10== VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA-------------- -11== VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA-------------- -12== VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA-------------- -13== WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA-------------- -14== YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA-------------- -15== YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA-------------- -16== YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA-------------- -17== YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA-------------- -18== YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA-------------- -19== YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA-------------- -20== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -21== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -22== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA-------------- -23== YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA-------------- -24== YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA-------------- -25== YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN-------------- -26== YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ-------------- -27== YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE-------------- -28== YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE-------------- -29== F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- -30== F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- -31=p F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF----------- -32== H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK-------------- -33=p H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK-------------- -34== K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE -35=p K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE -36== V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR--------------- - * : * : +1== VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ-------------------------- +2== 
VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ-------------------------- +3== VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ-------------------------- +4=p VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ-------------------------- +5=p ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ-------------------------- +6== CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA-------------------------- +7== IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ-------------------------- +8=opsin, VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- +9== VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK-------------------------- +10== VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK-------------------------- +11== ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK-------------------------- +12== VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK-------------------------- +13== VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK-------------------------- +14== FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- +15== FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK------------------------- +16== FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK------------------------- +17== LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK------------------------- +18== VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +19== IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK------------------------- +20== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +21== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +22== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK------------------------- +23== LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK------------------------- +24== LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK------------------------- +25== IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK------------------------- +26== LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK------------------------- +27== FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR------------------------- +28== ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR------------------------- +29== AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +30== AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +31=p 
AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF---------------------- +32== FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- +33=p FGAFYIPLLLMLVLYGRIF-------RAARFRIRK------------------------- +34== VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +35=p VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY +36== ASSFYVPVLIILILYWRIY-------QTARKRIR-------------------------- + * : * : -1== ------------------------------------------------------AAAAQQ -2== ------------------------------------------------------AAAQQQ -3== ------------------------------------------------------AAAQQQ -4=p ------------------------------------------------------AAAQQQ -5=p ------------------------------------------------------AAAQQQ -6== ------------------------------------------------------AAKAQA -7== ------------------------------------------------------VAAQQQ -8=opsin, ------------------------------------------------------VAKQQK -9== ------------------------------------------------------VAKQQK -10== ------------------------------------------------------VAKQQK -11== ------------------------------------------------------VAAQQK -12== ------------------------------------------------------VAAQQK -13== ------------------------------------------------------AAAQQK -14== ------------------------------------------------------LRDQAK -15== ------------------------------------------------------LRDQAK -16== ------------------------------------------------------LREQAK -17== ------------------------------------------------------LREQAK -18== ------------------------------------------------------MRAQAK -19== ------------------------------------------------------MRAQAK -20== ------------------------------------------------------MREQAK -21== ------------------------------------------------------MREQAK -22== ------------------------------------------------------MREQAK -23== ------------------------------------------------------MREQAK -24== 
------------------------------------------------------MRDQAK -25== ------------------------------------------------------MREQAK -26== ------------------------------------------------------LREQAK -27== ------------------------------------------------------MAAMAK -28== ------------------------------------------------------MAAMAK -29== --------------------------------------------P----GFPRVEPDSVI -30== --------------------------------------------P----GFPRVQPESVI -31=p --------------------------------------------P----GFPRVQPESVI -32== -------------------------TVKKVEKTGADTRHGASPAP---------QPKKS- -33=p -------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS- -34== TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN -35=p TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN -36== ------------------------------RRRGATARGGVGPPP---------VPAGGA +1== ------------------------------------------------------------ +2== ------------------------------------------------------------ +3== ------------------------------------------------------------ +4=p ------------------------------------------------------------ +5=p ------------------------------------------------------------ +6== ------------------------------------------------------------ +7== ------------------------------------------------------------ +8=opsin, ------------------------------------------------------------ +9== ------------------------------------------------------------ +10== ------------------------------------------------------------ +11== ------------------------------------------------------------ +12== ------------------------------------------------------------ +13== ------------------------------------------------------------ +14== --------------------------------------------------MN-------- +15== --------------------------------------------------MN-------- +16== --------------------------------------------------MN-------- +17== --------------------------------------------------MN-------- 
+18== --------------------------------------------------MN-------- +19== --------------------------------------------------MN-------- +20== --------------------------------------------------MN-------- +21== --------------------------------------------------MN-------- +22== --------------------------------------------------MN-------- +23== --------------------------------------------------MN-------- +24== --------------------------------------------------MN-------- +25== --------------------------------------------------MN-------- +26== --------------------------------------------------MN-------- +27== --------------------------------------------------LN-------- +28== --------------------------------------------------LN-------- +29== ---------------------------------PGFPRV----EPDSVIALNG------- +30== ---------------------------------PGFPRV----QPESVISLNG------- +31=p ---------------------------------PGFPRV----QPESVISLNG------- +32== --------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR-- +33=p --------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG-- +34== SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +35=p SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS--- +36== -------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA 1== ------------------------------------------------------------ @@ -280,217 +280,179 @@ 11== ------------------------------------------------------------ 12== ------------------------------------------------------------ 13== ------------------------------------------------------------ -14== KMN---------------VESLRS------------------------------------ -15== KMN---------------VDSLRS------------------------------------ -16== KMN---------------VESLRS------------------------------------ -17== KMN---------------VESLRS------------------------------------ -18== KMN---------------VSTLRS------------------------------------ -19== KMN---------------VTNLRS------------------------------------ -20== 
KMN---------------VKSLRS------------------------------------ -21== KMN---------------VKSLRS------------------------------------ -22== KMN---------------VKSLRS------------------------------------ -23== KMN---------------VKSLRS------------------------------------ -24== KMN---------------VKSLRS------------------------------------ -25== KMN---------------VASLRS------------------------------------ -26== KMN---------------VASLRA------------------------------------ -27== RLN---------------AKELR------------------------------------- -28== RLN---------------AKELR------------------------------------- -29== ALNG--------------IVKLQ----------------------KEVEECANLSR---- -30== SLNG--------------VVKLQ----------------------KEVEECANLSR---- -31=p SLNG--------------VVKLQ----------------------KEVEECANLSR---- -32== -VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL -33=p -LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL -34== GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN -35=p GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN -36== LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP +14== --VESL------------------------------------------------------ +15== --VDSL------------------------------------------------------ +16== --VESL------------------------------------------------------ +17== --VESL------------------------------------------------------ +18== --VSTL------------------------------------------------------ +19== --VTNL------------------------------------------------------ +20== --VKSL------------------------------------------------------ +21== --VKSL------------------------------------------------------ +22== --VKSL------------------------------------------------------ +23== --VKSL------------------------------------------------------ +24== --VKSL------------------------------------------------------ +25== --VASL------------------------------------------------------ +26== 
--VASL------------------------------------------------------ +27== --AKEL------------------------------------------------------ +28== --AKEL------------------------------------------------------ +29== --IVKL----------------------QK---------EVEECAN-------------- +30== --VVKL----------------------QK---------EVEECAN-------------- +31=p --VVKL----------------------QK---------EVEECAN-------------- +32== -------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG-- +33=p -------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG-- +34== -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- +35=p -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS-- +36== AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV -1== --------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA -2== --------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA -3== --------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA -4=p --------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA -5=p --------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA -6== --------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS -7== --------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA -8=opsin, --------------------ESESTQK------AEKEVTRMVVVMVLAFC---------- -9== --------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA -10== --------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA -11== --------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV -12== --------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA -13== --------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA -14== -------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS -15== -------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS -16== -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS -17== -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS -18== --------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS -19== --------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT 
-20== --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN -21== --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN -22== --------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN -23== --------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC -24== --------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC -25== --------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN -26== -------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS -27== --------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA -28== --------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA -29== --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -30== --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -31=p --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS -32== PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA -33=p PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA -34== DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA -35=p DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA -36== TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA - * . 
: +1== -------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H +2== -------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H +3== -------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N +4=p -------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N +5=p -------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N +6== -------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H +7== -------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N +8=opsin, -------------ESESTQK------AEKEVTRMVVVMVLAFC----------------- +9== -------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N +10== -------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N +11== -------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N +12== -------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N +13== -------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H +14== ----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G +15== ----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G +16== ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +17== ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G +18== ----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G +19== ----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G +20== ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +21== ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K +22== ----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K +23== ----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K +24== ----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K +25== ----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N +26== ----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S +27== ----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G +28== ----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G +29== ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +30== 
----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +31=p ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC +32== PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +33=p SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C +34== -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +35=p -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V +36== AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C + * . : -1== FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------ -2== MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------ -3== FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------ -4=p AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------ -5=p AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------ -6== LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------ -7== MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------ +1== QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL +2== QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL +3== KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF +4=p KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL +5=p KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL +6== RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I +7== RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M 8=opsin, ------------------------------------------------------------ -9== CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF------- -10== CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF------- -11== SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF------- -12== CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF------- -13== LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY--- -14== LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL--- -15== LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI--- -16== LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV--- 
-17== LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV--- -18== LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV--- -19== IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV--- -20== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- -21== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- -22== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF--- -23== YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF--- -24== YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC--- -25== FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC--- -26== WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC--- -27== LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ -28== LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ -29== TARPFICGTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------ -30== TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------ -31=p TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------ -32== LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------ -33=p LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------ -34== LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------ -35=p LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------ -36== ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------ +9== PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +10== PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V +11== PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V +12== PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V +13== KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T +14== DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N +15== DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S +16== DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N +17== DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N +18== 
DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T +19== NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K +20== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +21== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +22== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V +23== I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T +24== I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T +25== L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A +26== SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G +27== PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C +28== PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T +29== GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +30== GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR-- +31=p GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR-- +32== ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ---- +33=p ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR---- +34== DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- +35=p DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR-- +36== DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR-- -1== --GKNPLGDDE--SGASTSKTEVSSVS-TSPVS--------------------------- -2== --GKNPLGDDE--ASATASKTE------TSQVA--------------------------- -3== --GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS--------------------------- -4=p --GKNPLGDDE-SSTVSTSKTEVSS------VS--------------------------- -5=p --GKNPLGDEE-SSTVSTSKTEVSS------VS--------------------------- -6== --GKN-IEEDE--ASTSSQVTQVSS------VA--------------------------- -7== --GKA-MTDES--DTCSSQKTEVSTVS-STQVG--------------------------- +1== GDDE--SGASTSKTEVSSVS-TSPVSPA-------------------------------- +2== GDDE--ASATASKTE------TSQVAPA-------------------------------- +3== GDEDVSSTVSQSKTEVSSVS-SSQVSPA-------------------------------- +4=p GDDE-SSTVSTSKTEVSS------VSPA-------------------------------- +5=p 
GDEE-SSTVSTSKTEVSS------VSPA-------------------------------- +6== EEDE--ASTSSQVTQVSS------VAPEK------------------------------- +7== TDES--DTCSSQKTEVSTVS-STQVGPN-------------------------------- 8=opsin, ------------------------------------------------------------ -9== --GKK-VDDGS--ELSSASKTEVSSV---SSVS--------------------------- -10== --GKK-VDDGS--ELSSASKTEVSSV---SSVS--------------------------- -11== --GKK-VDDGS--EASTTSRTEVSSVS-NSSVA--------------------------- -12== --GKK-VDDGS--EVST-SRTEVSSVS-NSSVS--------------------------- -13== -QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM--------------------------- -14== ---NE-KAPES----SAVASTSTTQEPQQTTAA--------------------------- -15== ---SE-KAPES----RAAISTSTTQEQQQTTAA--------------------------- -16== ---NE-KSGEI----SSAQSTTTQEQ-QQTTAA--------------------------- -17== ---NE-KSGEA----SSAQSTTTQEQTQQTSAA--------------------------- -18== ---HE-TETKS-NDDSQSNSTVAQDKA--------------------------------- -19== ---HE-KDPND-VEENQSSNTQTQEKS--------------------------------- -20== ---GK-VDDGK-SSDAQSQATASEAESKA------------------------------- -21== ---GK-VDDGK-SSDAQSQATASEAESKA------------------------------- -22== ---GK-VDDGK-SSEAQSQATTSEAESKA------------------------------- -23== ---GN-TDEPKPDAPASDTETTSEADSKA------------------------------- -24== ---GT-TDEPKPDAPPSDTETTSEAESKD------------------------------- -25== ----A-AEPSS-DAVSTTSGTTTVTDNEKSNA---------------------------- -26== ---GS-GESGS-DVKSEASATTTMEEKPKIPEA--------------------------- -27== FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG -28== FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG -29== ---QY-RNINR--KLSAAGMHEALKLAER------------------------------- -30== ---QY-RNINR--KLSAAGMHEALKLAER------------------------------- -31=p ---QY-RNINR--KLSAAGMHEALKLAER------------------------------- -32== ---KF-CRQ--------------------------------------------------- -33=p ---KF-CRR--------------------------------------------------- -34== 
---KY-RRGHR------------------------------------------------- -35=p ---KY-RRGHR------------------------------------------------- -36== ---RR-VRRRR--A---------------------------------------------- - - -1== -----------------------------------PA----------------------- -2== -----------------------------------PA----------------------- -3== -----------------------------------PA----------------------- -4=p -----------------------------------PA----------------------- -5=p -----------------------------------PA----------------------- -6== -----------------------------------PEK---------------------- -7== -----------------------------------PN----------------------- -8=opsin, ------------------------------------------------------------ -9== -----------------------------------PA----------------------- -10== -----------------------------------PA----------------------- -11== -----------------------------------PA----------------------- -12== -----------------------------------PA----------------------- -13== -----------------------------------PAHPV-------------------- -14== ------------------------------------------------------------ -15== ------------------------------------------------------------ -16== ------------------------------------------------------------ -17== ------------------------------------------------------------ -18== ------------------------------------------------------------ -19== ------------------------------------------------------------ -20== ------------------------------------------------------------ -21== ------------------------------------------------------------ -22== ------------------------------------------------------------ -23== ------------------------------------------------------------ -24== ------------------------------------------------------------ -25== ------------------------------------------------------------ -26== ------------------------------------------------------------ -27== 
Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY -28== YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY -29== -----------------------------------PERPEFVL-QNADYCRKKGHDS--- -30== -----------------------------------PERSEFVL-QNSDHCGKKGHDT--- -31=p -----------------------------------PERSEFVL-QNSDHCGKKGHDT--- +9== DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +10== DDGS--ELSSASKTEVSSV---SSVSPA-------------------------------- +11== DDGS--EASTTSRTEVSSVS-NSSVAPA-------------------------------- +12== DDGS--EVST-SRTEVSSVS-NSSVSPA-------------------------------- +13== GKAS--PGTPGPHADVTAAGLRNKVMPAHPV----------------------------- +14== EKAP--ESSAVASTSTTQEP--QQTTAA-------------------------------- +15== EKAP--ESRAAISTSTTQEQ--QQTTAA-------------------------------- +16== EKSG--EISSAQST-TTQEQ--QQTTAA-------------------------------- +17== EKSG--EASSAQST-TTQEQ-TQQTSAA-------------------------------- +18== ETKS--NDDSQSNSTVAQDK-A-------------------------------------- +19== DPND--VEENQSSNTQTQEK-S-------------------------------------- +20== DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +21== DDGK--SSDAQSQA-TASEA-ESKA----------------------------------- +22== DDGK--SSEAQSQA-TTSEA-ESKA----------------------------------- +23== DEPK--PDAPASDTETTSEA-DSKA----------------------------------- +24== DEPK--PDAPPSDTETTSEA-ESKD----------------------------------- +25== EPSS--DAVSTTSGTTTVTD-NEKSNA--------------------------------- +26== ESGS--DVKSEASATTTMEE-KPKIPEA-------------------------------- +27== EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP +28== EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP +29== ------KLSAAGMHEALKLAERPERPEF------------VLQNADY------------- +30== ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- +31=p ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH------------- 32== ------------------------------------------------------------ 33=p 
------------------------------------------------------------ 34== ------------------------------------------------------------ 35=p ------------------------------------------------------------ -36== -----------------------------------PQ----------------------- +36== ------A---------------PQ------------------------------------ -1== -- -2== -- -3== -- -4=p -- -5=p -- -6== -- -7== -- -8=opsin, -- -9== -- -10== -- -11== -- -12== -- -13== -- -14== -- -15== -- -16== -- -17== -- -18== -- -19== -- -20== -- -21== -- -22== -- -23== -- -24== -- -25== -- -26== -- -27== QA -28== QA -29== -- -30== -- -31=p -- -32== -- -33=p -- -34== -- -35=p -- -36== -- - +1== --------------------------------------------------------- +2== --------------------------------------------------------- +3== --------------------------------------------------------- +4=p --------------------------------------------------------- +5=p --------------------------------------------------------- +6== --------------------------------------------------------- +7== --------------------------------------------------------- +8=opsin, --------------------------------------------------------- +9== --------------------------------------------------------- +10== --------------------------------------------------------- +11== --------------------------------------------------------- +12== --------------------------------------------------------- +13== --------------------------------------------------------- +14== --------------------------------------------------------- +15== --------------------------------------------------------- +16== --------------------------------------------------------- +17== --------------------------------------------------------- +18== --------------------------------------------------------- +19== --------------------------------------------------------- +20== --------------------------------------------------------- +21== --------------------------------------------------------- +22== 
--------------------------------------------------------- +23== --------------------------------------------------------- +24== --------------------------------------------------------- +25== --------------------------------------------------------- +26== --------------------------------------------------------- +27== QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA +28== QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA +29== --------------------------------------------CRKKGHDS----- +30== --------------------------------------------CGKKGHDT----- +31=p --------------------------------------------CGKKGHDT----- +32== --------------------------------------------------------- +33=p --------------------------------------------------------- +34== --------------------------------------------------------- +35=p --------------------------------------------------------- +36== --------------------------------------------------------- +