# HG changeset patch
# User iuc
# Date 1525306691 14400
# Node ID bdfc22c1c3e366cb896c473451dc146c9a38a79e
# Parent 5673e72241aa573a40093c7b82a8d7942c1d06f7
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/repeat_masker commit 8dacb4321122d92df0983e0794cf23572be03224
diff -r 5673e72241aa -r bdfc22c1c3e3 RepeatMasker.xml
--- a/RepeatMasker.xml Tue Sep 17 03:23:49 2013 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,307 +0,0 @@
-
- Masks different kinds of repeats
-
- RepeatMasker
-
-
-## The command is a Cheetah template which allows some Python based syntax.
-## Lines starting hash hash are comments. Galaxy will turn newlines into spaces
-
-## create temp directory
-#import tempfile, os
-#set $dirname = os.path.abspath( tempfile.mkdtemp() )
-#set $input_filename = os.path.split( str($query) )[-1]
-#set $output_basename = os.path.join( $dirname, $input_filename )
-
-
-RepeatMasker
--parallel 8
-
-$nolow
-$noint
-$norna
-
-#if str($species)!="all":
- $species
-#end if
-
-
--dir $dirname
-
-#if $adv_opts.adv_opts_selector=="advanced":
-
- #if str($adv_opts.gc)!="0":
- -gc $adv_opts.gc
- #end if
-
- $adv_opts.gccalc
-
- #set $output_files_list = str($adv_opts.output_files).split(',')
- #if "gff" in $output_files_list:
- -gff
- #end if
- #if "html" in $output_files_list:
- -html
- #end if
-
- $adv_opts.slow_search
- $adv_opts.quick_search
- $adv_opts.rush_search
- $adv_opts.only_alus
- $adv_opts.is_only
-
-#else:
- ## Set defaults
- -gff
-
-## End of advanced options:
-#end if
-
-$query
-
-2>&1;
-
-## Copy the output files to galaxy
-## AgR: if there are no repeats, the output files may not exist.
-## This causes the job to fail, so touch files to ensure they exist.
-#if $adv_opts.adv_opts_selector=="advanced":
-
- #if "summary" in $output_files_list:
- ## Write out the summary file (default)
- #set $summary_file = $output_basename + '.tbl'
- touch $summary_file;
- cp $summary_file $output_summary;
- #end if
-
- #if "gff" in $output_files_list:
- ## Write out the gff file (default)
- #set $gff_file = $output_basename + '.out.gff'
- touch $gff_file;
- cp $gff_file $output_gff;
- #end if
-
- #if "html" in $output_files_list:
- ## Write out the html file
- #set $html_file = $output_basename + '.out.html'
- touch $html_file;
- cp $html_file $output_html;
- #end if
-
-#else:
-
- ## Write out the summary file (default)
- #set $summary_file = $output_basename + '.tbl'
- touch $summary_file;
- cp $summary_file $output_summary;
-
- ## Write out the gff file (default)
- #set $gff_file = $output_basename + '.out.gff'
- touch $gff_file;
- cp $gff_file $output_gff;
-
-
-## End of advanced options:
-#end if
-
-## Write out mask sequence file
-#set $mask_sequence_file = $output_basename + '.masked'
-touch $mask_sequence_file;
-cp $mask_sequence_file $output_mask;
-
-## Write out standard file (default)
-## The default '.out' file from RepeatMasker has a 3-line header and spaces rather
-## than tabs. Remove the header and replace the whitespaces with tab
-#set $standard_file = $output_basename + '.out'
-tail -n +4 $standard_file | tr -s ' ' '\t' > $output_std;
-
-## Delete all temporary files
-rm $dirname -r
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'mask' in adv_opts['output_files'])
-
-
-
- (
- (adv_opts['adv_opts_selector'] == 'advanced' and 'summary' in adv_opts['output_files'])
- or
- (adv_opts['adv_opts_selector'] == 'basic')
- )
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'html' in adv_opts['output_files'])
-
-
-
- (adv_opts['adv_opts_selector'] == 'advanced' and 'gff' in adv_opts['output_files'])
-
-
-
-
-
-.. class:: warningmark
-
-**What it does**
-
-RepeatMasker is a program that screens DNA sequences for *interspersed repeats*
-and *low complexity* DNA sequences. The output of the program is a detailed
-annotation of the repeats that are present in the query sequence as well as a
-modified version of the query sequence in which all the annotated repeats have
-been masked (default: replaced by Ns).
-
------
-
-**How to read the results**
-
-
-
-The annotation file contains the cross_match output lines. It lists all best matches
-(above a set minimum score) between the query sequence and any of the sequences in
-the repeat database or with low complexity DNA. The term "best matches" reflects
-that a match is not shown if its domain is over 80% contained within the domain
-of a higher scoring match, where the "domain" of a match is the region in
-the query sequence that is defined by the alignment start and stop. These domains
-have been masked in the returned masked sequence file. In the output, matches are
-ordered by query name, and for each query by position of the start of the alignment.
-
-Example:
-
-======== ========= ========= ========= ========== =========== ========= ========= ============ =============== =================== ================ ============== ======= ==
-SW score perc div. perc del. perc ins. query seq. q-pos begin q-pos end (left) w complement matching repeat repeat class/family repeat-pos begin repeat-pos end (left) ID
-======== ========= ========= ========= ========== =========== ========= ========= ============ =============== =================== ================ ============== ======= ==
- 1306 15.6 6.2 0.0 HSU08988 6563 6781 \(22462) C MER7A DNA/MER2_type 336 103 \(0) 1
- 12204 10.0 2.4 1.8 HSU08988 6782 7714 \(21529) C TIGGER1 DNA/MER2_type 2418 1493 \(0) 2
- 279 3.0 0.0 0.0 HSU08988 7719 7751 \(21492) + (TTTTA)n Simple_repeat 1 33 \(0) 3
- 1765 13.4 6.5 1.8 HSU08988 7752 8022 \(21221) C AluSx SINE/Alu 289 1 \(23) 4
- 12204 10.0 2.4 1.8 HSU08988 8023 8694 \(20549) C TIGGER1 DNA/MER2_type 1493 827 \(925) 5
- 1984 11.1 0.3 0.7 HSU08988 8695 9000 \(20243) C AluSg SINE/Alu 305 1 \(5) 6
- 12204 10.0 2.4 1.8 HSU08988 9001 9695 \(19548) C TIGGER1 DNA/MER2_type 827 2 \(1591) 7
- 711 21.2 1.4 0.0 HSU08988 9696 9816 \(19427) C MER7A DNA/MER2_type 122 2 \(224) 8
-======== ========= ========= ========= ========== =========== ========= ========= ============ =============== =================== ================ ============== ======= ==
-
-This is a sequence in which a Tigger1 DNA transposon has integrated into a MER7 DNA transposon copy.
-Subsequently two Alus integrated in the Tigger1 sequence. The simple repeat is derived from the
-poly A of the Alu element. The first line is interpreted like this:
-
-:Table description:
-
-1. **1306** = Smith-Waterman score of the match, usually complexity adjusted
- The SW scores are not always directly comparable. Sometimes
- the complexity adjustment has been turned off, and a variety of
- scoring-matrices are used.
-
-#. **15.6** = % substitutions in matching region compared to the consensus
-#. **6.2** = % of bases opposite a gap in the query sequence (deleted bp)
-#. **0.0** = % of bases opposite a gap in the repeat consensus (inserted bp)
-#. **HSU08988** = name of query sequence
-#. **6563** = starting position of match in query sequence
-#. **6781** = ending position of match in query sequence
-#. **(22462)** = no. of bases in query sequence past the ending position of match
-#. **C** = match is with the Complement of the consensus sequence in the database
-#. **MER7A** = name of the matching interspersed repeat
-#. **DNA/MER2_type** = the class of the repeat, in this case a DNA transposon fossil of the MER2 group (see below for list and references)
-#. **336** = starting position of match in database sequence (using top-strand numbering)
-#. **103** = ending position of match in database sequence
-#. **(0)** = no. of bases in (complement of) the repeat consensus sequence prior to beginning of the match (so 0 means that the match extended all the way to the end of the repeat consensus sequence)
-#. **1** = Identifier
-
-An asterisk (\*) in the final column (no example shown) indicates that there is
-a higher-scoring match whose domain partly (<80%) includes the domain of this match.
-
-Note that the SW score and divergence numbers for the three Tigger1 lines are identical.
-This is because the information is derived from a single alignment (the Alus were deleted
-from the query before the alignment with the Tigger element was performed).
-The program makes educated guesses about many fragments if they are derived from
-the same element (e.g. it knows that the MER7A fragments represent one insert).
-In a next version I can identify each element with a unique ID, if interest exists
-(this could help to represent repeats cleaner in graphic displays).
-
-
--------
-
-**References**
-
-Smit, AFA, Hubley, R and Green, P. RepeatMasker Open-3.0.
-
-http://www.repeatmasker.org/
-
-
-
diff -r 5673e72241aa -r bdfc22c1c3e3 readme.rst
--- a/readme.rst Tue Sep 17 03:23:49 2013 -0400
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
@@ -1,63 +0,0 @@
-===============================
-Galaxy wrapper for RepeatMasker
-===============================
-
-This wrapper is copyright 2013 by Björn Grüning.
-
-This is a wrapper for the command line tool of RepeatMasker from the Institute for Systems Biology.
-http://www.repeatmasker.org/
-
-
-Smit, AFA, Hubley, R & Green, P. RepeatMasker Open-3.0.
-1996-2010 .
-
-
-Additional Information:
-Using RepeatMasker to identify repetitive elements in genomic sequences.
-http://www.ncbi.nlm.nih.gov/pubmed/19274634
-
-============
-Installation
-============
-
-To install RepeatMasker, please use the following instructions:
-
-http://www.repeatmasker.org/RMDownload.html
-
-To install the wrapper, copy the file RepeatMasker.xml into the Galaxy tools
-folder and modify the tool_conf.xml file to make the tool available to Galaxy.
-Add a line like the following:
-
-Add the tool definition to your tool_conf.xml file under Galaxy root.
-
-
-=======
-History
-=======
-
-- v1.1: Initial public release
-- v0.1.1: patch from Simon Guest, to create empty files if no repeat is found
-- v0.1.2: remove trailing semicolon, redirect all output to stdout
-
-===============================
-Wrapper Licence (MIT/BSD style)
-===============================
-
-Permission to use, copy, modify, and distribute this software and its
-documentation with or without modifications and for any purpose and
-without fee is hereby granted, provided that any copyright notices
-appear in all copies and that both those copyright notices and this
-permission notice appear in supporting documentation, and that the
-names of the contributors or copyright holders not be used in
-advertising or publicity pertaining to distribution of the software
-without specific prior permission.
-
-THE CONTRIBUTORS AND COPYRIGHT HOLDERS OF THIS SOFTWARE DISCLAIM ALL
-WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED
-WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL THE
-CONTRIBUTORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY SPECIAL, INDIRECT
-OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS
-OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE
-OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE
-OR PERFORMANCE OF THIS SOFTWARE.
-
diff -r 5673e72241aa -r bdfc22c1c3e3 repeatmasker.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/repeatmasker.xml Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,230 @@
+
+ RepeatMasker
+
+
+ repeatmasker
+
+
+ '${output_log}' &&
+ mv rm_input.fasta.tbl '${output_table}' &&
+ #if $gff == '-gff':
+ mv rm_input.fasta.out.gff '${output_gff}' &&
+ #end if
+ #if $advanced.keep_alignments == '-ali':
+ mv rm_input.fasta.align '${output_alignment}' &&
+ #end if
+ #if $advanced.poly == '-poly':
+ sed -r 's/^ *// ; s/ *$//; s/\+ //; s/ +/\t/g' rm_input.fasta.polyout >'${output_polymorphic}' &&
+ #end if
+ #end if
+ mv rm_input.fasta.cat '${output_repeat_catalog}'
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ not advanced['is_only']
+
+
+ not advanced['is_only']
+
+
+ not advanced['is_only']
+
+
+
+ not advanced['is_only'] and advanced['keep_alignments']
+
+
+ not advanced['is_only'] and advanced['poly']
+
+
+ not advanced['is_only'] and gff is True
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ @misc{RepeatMasker,
+ title = {RepeatMasker Open-4.0},
+ howpublished = {\url{http://www.repeatmasker.org}},
+ author = {Smit, AFA and Hubley, R and Green, P.},
+ year = {2013-2015}}
+
+
+
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/repeats.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/repeats.fasta Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,64 @@
+>Asian_seabass_ONSAT_SB_Concensus_Lenght_170_bp
+CGAAAAATTTAATAATTTAGGGGTCTTGAGCATGGGCGTGGTAAAATGCCCTCGGTAGCG
+CCACCTACATTTTTAAACGGAACAGCCCCTCAAGCCCGTTGCGCCTAAAAATCTGAAAAT
+CTGCACACATATGTAACATCCCATGACGCACCAAAAAGTCTCTTGGAGCCA
+>Asian_seabass_MOSAT_SB_T_34a_satellite_DNA
+TTTGTGACATCACTACATAGTTTGTTGAAAACGTAC
+>Asian_seabass_MOSAT_SB_T_34b_satellite_DNA
+TTTGTGACATCACACATAGTTGTGGGTCAGTAC
+>Sat_38
+AAAAAATGTCATAGTATAGTATGGCGTCAAAAAACATG
+>Asian_seabass_Sat_217_Consensus_Length_217_bp
+AGTAAACAAGCATTATGGTTGAAACCATAATTTCCTGTCGGGAGAGCCTTTCCCTCTTTT
+GTGCACTGTATGCAATCCCAGAGTGTGAATAAGCGCTTTTCCAGCGTTTTGAGGCTTATT
+CAGCTCAGAATGGCTTAATACTGCACTATCTGACCAGGACAAAGACAAACTAAGAACTCA
+GCCACACGGACATGAAAGTTGTTTTACTTACAATATT
+>Asian_seabass_Sat_217_Consensus_Length_427_bp
+CCAGCGTTTTGAGGCTTATTCAGCTCAGAATGGCTTAATACTGCACTATCTGACCAGGAC
+AAGACAAACTAAGAACTCAACACACTGACATGAAAGTTTCTATATTTCTATTAAAATAAA
+CAAACATTATGGTTGAAACCATAATTTCATTTCGGGAGAGCCTTTCCCTCTTTGTGGCAC
+TGTATGTAATCTGAAGTGTGAATAACGCTTTTCCCGCGTTTGAGGCTTATTCAGCTCAGA
+ATGGCTTAATACTGCACTATCTGACCAGGACAAGACAAACTAAGAACTCAGCCACACGGA
+CATGAAAGTTGTTTACTTTACAATATTAGTAAACAAGCATTATGGTTGAAACCATAATTT
+CCTGTCGGGAAGAGCTTCCCTCTTTTTGTGCACTGTATGCAATCCCAGAGTGTGAATAAG
+CGCTTTT
+>Asian_seabass_Sat_LM_Consensus_Length_453_bp
+CCCAACAAAATAGCACTTACTGCTTTCCAAATTCAAGTCTGTGCCTGTGTTAGGGTAATG
+TTGGTGATAAATTGATGTACTTAGCTTATCCTGTGAAAATGGTGTAAAATGGCAGTCTCC
+ATGTTTGTTGAAGAAACTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAG
+AAATCATGAGTGGCTCTTATTGAAGTGATCAGAGTTGGACTCCATTAAGAAAATGGCTTT
+CAATGTAGTCAGTTGCTTTGTCACTTAAAACTGCCCCAACAAGTAGCACTTACTGCAATT
+TGGTAGTCAAAGTCAATGCTCAAGTTAAGGGTAATAGTAGTGACATAATAGAAAAATCTC
+TAAATATATTTGCTGGCAGCTTTAATATACAGAATGAGTGCCATGATGAATTCTTGATAC
+AGAACAGGGACTTCCAAAATCAGCCAACACTAA
+>Asian_seabass_Sat_LM_Consensus_Length_218_bp
+CCCAACAAAATAGCACTTACTGCTTTCCAAATTCAAGTCTGTGCCTGTGTTAGGGTAATG
+TTGGTGATAAATTGATGTACTTAGCTTATCCTGTGAAAATGGTGTAAAATGGCAGTCTCC
+TGTTTGTTGAAGAAACTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAGA
+AATCATGAGTGGCTCTTATTGAAGTGATCAGAGTTGG
+>Asian_seabass_Sat_LM Consensus_Length_150_bp
+CTCACAACCAAGACAACCCCAAAGAGAAGCACTTATGAAGACAGAAATCATGAGTGGCTC
+TTATTGAAGTGATCAGAGTTGGACTCCATTAAGAAAATGGCTTTCAATGTAGTCAGTTGC
+TTTGTCACTTAAAACTGCCCCAACAAGTAGCA
+>Asian_seabass_Sat_Unk_Consensus_Length_341_bp
+GTTTGGGTAAAAATATTGTCTATTTACGAGCTATCCTCTATATATTTTTGATCTGATTAA
+TAAATACCTCTAGCCCACAAACTGTGGTATTTTGCTATGTGGCAGTTCACCCGAAAGTCC
+AGTAGCATTTATCGCATTTTCTAAAGATAGTCAGTGCCTGAAAGTTTGAGGCAGATAAAC
+AAATTGTTCAAGTAAGAACTATATCTTTCTTATGATTTTACCGCAATCATACAGGTTGTT
+TCTTGTGGTCTGCTGGGCATTGTATCCCTTTGTTGTATGGATTTTTCCTTTCTTTAATGA
+TCTCCTCCCTGGAGTTTGTAATCCCTGTTTGTAGTGGAATT
+>Asian_seabass_Sat_Unk_Consensus_Length_789_bp
+CAAAAAAATGGAAAAAAAAAAAGTGGCTCATTTGAAGTGAATCAGAGTTGGGTAACATTG
+TCCTTAATTACAGCTATGCTTATATACTTGATCTGATAATAATACTCTAGCCACAATCTG
+TGGGTATTCTGCTATTTGCAGTCCACCCAAAGTCATAGCATTTAATCCATTCTAGGAAGA
+TACGTCAGTGCTGAGTTGAGCCAATAACACCAAATTGTCATAAGAACTATTATTTTCTTT
+ATGATTTTTACGCATCAGTACAGGTGTTTTCTTGTGGTTTCTGCTGCATGTATCCCTGTT
+GTAAGTGGATTCTCCTTTGCTTATGATCTCCTCCGCTGCGTTGTATCCTGTTTGTAGTGG
+ATTTCCTTGCACTGATTCTGCCCGCTCTTAATACTGAATGAACGCCCTCCCACCAGTAGT
+ACTGCCACCTTTGTTTTTTCACAAAGTGTTCAATGGCCTTGATAATGACTTGGTAACTAC
+ATCACCACTTTTTTGTACGTAATCAACAGACAATCACCCATTAAATTCATGCGGCCATTA
+GGCAGCTTGATGAGCTGGACATTTGACCTCCCCAATGAATCTTTGCTGATGGGAAACTTA
+TTGCCACCATAAAGTGAACCAGCATTGCTATGTCCATGCTGTAATTTGAAAACCCAATAC
+AAAGAAGCCCTGCATATATACCTCCCAAATTGGCTTCTGAGACCCGGGCGTAATCACTGC
+ATGGCCATAGATAAACATTGAAATCTTCTGTTGCAGTCAGTTTGCTTTTTGTCAACTTTA
+AAAACTGCC
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,238 @@
+>scaffold_1
+TGCTTTTCTGAGATTTATGTCAGCTCCCCATTGGGAGATACAGGAGAATCCAATATATTC
+CTGTCTCGCTTCTTTTATATTTATCCTTTCTACACCTGACATCCTCAGTGATTGAAGTGA
+CAAAAAGTGGAGCGCACGCAGTGGTCATTACCCTCCAATGGTACTTCTAATTAAGGAAAG
+ATTTTTTGCATTCACTGAGCAAAACACTTATTTGCATGAATGGAAAATCATAAATGAGGG
+GTCCATTAAACAAATTTCCTAATTGTTTGCTTTTTTTTCTTCCTACTTCACCATCCCTCT
+AAAGCTATTACTCTCTATTCTACCCCATTATCGAGTGCACAAACACCAGCCCCAAATTGT
+CTTATCTCTGCTTTGATAAATGATATTTTTTTCTCTTATAATTGTGTTTCTCTCTAGATG
+TGCGGTGTCCATCAAGACACTGGATGTCACGTGGTCACTCCTGTGAAGAGCGAACTGTGT
+GGAACCCGAAGTACTGTGTGGTTGCTGACTGTCAGATGCTGCTTCTGAATGAGGAGGAGG
+TGGTGAGAGCAGACAGCACAATCTCTTGTCTGGCATGTTCCTCTGTGTCACCATTGTCTC
+TCTCATCTGCTCGTGTGTGTGTGTGTGTGTGTCCTTGTCAATGTCATTACACAATTTATG
+TTGGTGCACTGCATGTCAGAGTCTGAACTTTGTTGGACATCTACTTTCTGTCACCTGATA
+CCTCATACTTTACACTCTAATCCCTTTTTCCTTTCTAACTGCTGCTGTGTTAAGCTGTCA
+TATTAATATACTAAATAATGATAATATTAATTCTAATAATGATAGTGAATGGAGATTCAC
+AATGAAGAAACACAAGGTCCAGACTGAACCCCTGTGCTGTGTGAAGAGTTCACTCTACAT
+TTACATTCATCCCACATCAGAGACCAGCAATAGCCAGGTTAAGCAGAGCAAGGCTGAGTC
+TGGCTCTTTGCCTCTGTTGTTTTGATTAGTGTCACACTGGATTATGCTAGTTTGTGTGAG
+ATTAGAGGTCCTGTTGTTACGAGCAAATCAGCAGTCAGCAGGGTAATCTAAATTACATTG
+TTCTGTCGGCAATATCCTCTCCTCGCTCAACAGCTTTGTGTGAGCTCATATTTAAAGCCC
+CCACAGTAGTGCAGTGCATAAAATCATGCAGATACAGATCAGAAGCTTCAGGTAATGTTT
+ACATCAAACATCAGGGGGAAAATGTGATCTCAGTGCCTCTGACCGTGGTGTGATTGTTGG
+TGCCGGACAGGCTGGTTTGAGTATTTCTAAAACTGCTGATCTCCTGGGATTTTCACACAC
+GGCATTCTCTAGAGTTTACTCAGAACGGTGTGGAAAGCAAAAAAACATCCCGCGAGCTGC
+AATCCTGCGGATGGAAACACCTTGTTGATGGGATATGTCAGAGGAATGGCCAGGCTGGAT
+CAATCTGACAGAAAGGCGGTAACTCAGATAAGCACTCTCTACAACTGTGGTGAGCAGAAA
+AGCGTTCTCAGAATGCACAACACGTTCAACCTTGAGGAAGATGTTGCTACAGCAGCAGAT
+GAAGACCACGTCTGGTTCCACTCCTGTCAGCCAAGAACATCTCAGACTGCACAGGACACC
+AAAACAAAAACACATCCTGTTTTCTACTGGTGGTAGAGTCACAATTTGGCAATAAGATAA
+ATCCATGGACCCAACTTGCCTTGTGTCAATAGACCAAGCTGCTGGTGGTCTTGGGGAATG
+TTTTCTTTACACTTTCACACTATCGGCCTATATAAAATCCTATTATAAACTGCTGTACAG
+TGCATTGGGTTTGATAAGCCCTCTAAGTCTGTATATCATGATCTCATTGATACCTGCGGC
+AATACACCCCCACAAACGCAGCTCCCTGCATTTTAAGTATTATAGAGAGTAATTTCACTG
+TCCATGTCTTTTTTGATCATAAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAAT
+GCTGAAGCAGGTCTAGGTGCTGTATACAACACTGTATTGAAATGCTGAAGCCAATATATC
+AATCTATCTGTCTATATTTTATGAAATATCAGAGCATTTTAGTCCAAATTTGTCTGTTTT
+GTTCATTGCAATGCTGACTGCTTAACATTTTCCTCAGTGGTGGCCATCACCACAGCATTT
+ACTGGTGAGTTTTACCAAGCTACAGTGGGCCACAATGAGTTACCTGTTATTGGCCTGGCT
+CTATGGCATGCAGAAAACAGTCAGCCAATCAGAGGACAGACTCAGAGACAGACACAAAGT
+GCCCTGTTCTTGTTAGAGCAGAGATAAATGAGACAGAGGAGATGTAAAACTATACTGAGA
+TGGTTTTTTGGTTCTTAAAACCACAAATATATTGTATTACGGATATCAAAACTTCAAATA
+AAACCAGTAAAGTGTAAAACATGGGACCTCTAAATGAAGGGCTGTTTTGTTTCGTAGTTC
+TAGATTATGTCACTATGTGGCCTCGGTCTCTGTCTGCGTAAAGCGGCTACATGTAGAATT
+TGACCCACTTTGGTGCCCACATATGGTAACTAAAACACTACAGACAGTATGCACTCCAAC
+CCTATATAATTTATGTCCTTCAGTGAAGCCTACAAAATGTGCAGCATGATTTGCTATGAT
+TAATACCTAGAATTATATTAAATTTTAGAAGTTTAGAGAGATGGCTTATACCTTTTTCTG
+AGCATGGAGTCATCTCATGTAATTTGTCACATACCTTTGGCCAGCTTAAACCTGGTCATT
+CCAGTGAGAGCTGCTCACCCAAATGTTTCTGTATGCACCTCCTGCTGTGGGTGCCAATAG
+CTCATGCAAGTTGGTGTCTTTCAACTAAGGCCACTATGTGAGGACCATCAGCAGCAAATT
+AAATTAGAAGTGCCTTGGAGTTTCTCAGGCCCTCTTCTATGATCATTAAGGTCTCAGTGA
+CAGAACAGTGCCCCTTTGAGGGACTATGGCATCTTGAGCACTTAAGTTGGCCGAATGTTT
+GATCTCAAATATGAGTGCACTGTTTCAAAGTCACAAAAGCCTCTGGACAAGGCATAGTTA
+CTGGGCTTGGTTAACCTTTTTTTCATACCGGCGTGACTGCTGGAACTTGGAACATGTAGC
+CTAAGTTTCCCTTTGTCTGCAATTACTGAGGTATGCCATGTTGAAATAGAACAATAATTG
+CAGGGAGGAATTATTCCAATCGACCCATCGGCAGGCTTTCCAATACAGTGCTTTTTGTTT
+CACAGCAACAAAGAACAAGAGCTTTTAAATGCATCCATCTGGACCCTGACTATGAAAGGT
+CATTGGTAACGCTGCTGGATTTCTGTTATGTCAGCAAACTGCAGGTCAAAGCGATGATAC
+AGTCTTATAATGGCTTTCTCCAAGTGAAGGTGGGATAACATGGTTTAAACAAGCTCAGTT
+AAATGGATCAGAGCATCAACTGCTGTGAACAAGCAATCACACGGTCAAGGTCAAACATTT
+ACACTTCTGAGAGATCTGGAGAGTATGTCATGGCAGTATTGCTTTTCAGTTATTTCAGTA
+ACTGATTACGCCTTGTACTTAGTCTCAGAATTAGTGATTTGATTCAAAGTGTTTTATATA
+TGTATATTTCAAAGCAAAAATACAGCTTAGGTAAAGCTCCTTAGACTCATGCAGCCTAAT
+TTACTGTAGACATTCCTCCATGTACAGTACTGTGCAAATGTTTTAGGCAGTTTTAGGCAC
+TAAAGGTGAACTGAGGATGCAGTCCCACGATTAATTTTTATTCATCAGTTAACCTCATGT
+GAAGTGTAGTAAACAGAAAAAACCTAAATCAGATCAGTATTTCTTATGACCCCCCTCCCC
+TACCACCCATCTTTAAAACAGCTCCAGTTCTCCTCAATCCCCCTGTACTTAGGTAGTTTT
+TTTCTAGCGTCTTGGAGAAGTTGCCTCAGTTCTTCTGTGGATTTTAGGCTGTCTCTGTGT
+CTTCTGTCTCCTCATGTATTCTCAGACTGACTCCATGATGTTGAGATCAGGGCTCTGTGG
+TGGGGGGGTCAGACCATCTGTTGCGGGACTCCTTGTTCTTCTTGTCTCTGAGGATAGTTC
+TTTATGATGCTGACTGTGTGATTGGACTCATTGTCCTGCTGCAGAATTAATCTGGGACTG
+ATCAGACATCTCCCTGATTGTACTGACAAAGGATAAGAGCAAAAACCTGTAGACTGCCTA
+AAACTTCTGCACAGTACTGCACAATACTGTATGTATGTGTGATAATACTCAGAAGTGATA
+TAGAGTGGTTCAGGAGAAGCCTTAACTTACTTGTTCTTCTTTTCCCTATGATGCAATTTC
+TCTCCAAGCAAACAGTACATAATGAAATATGTCTAAGAAAACACTAGCTGTTTGTCTTTT
+TGAAACACATTTAATAATTCAGATTTAGCCACAAATTAAAAATGAGCTTATACTTTGAAC
+TTGCCCATTGGTTTTGATGTATGAAGCTGACAGATTTAGTCCACTGCATACTGCACTTTT
+TTGGATAGTGAAATAAATTAATTTATTATGCAGCATTTAAGCATATTGCTGTTATCTAGA
+ATTTTATATATTAATAGGTATATATTATATTAACTCTTCATTTGCTTAAATTTGGCCTGT
+ATATTCCTCCATTTTATACAACCTTTAGAAAACACTGGAGTGAACAAAAATGTGAGGTTC
+AAAAGTGAGAGGAAAGAAAAATCAGTGTGTGCAGCAAGACTGTAAGAGTCCCTGAACAAA
+AGTGTTGATTTATTGTTGGCTGTGAAAGTTTTTGCTGCAGGGGTTTTTGTAAACAGTGAC
+TCTTCTTTATGTCTTTGTTTCTATCTTTTTGTGTTTTCTTTTTTCATCTTATTCTATTTT
+TCTCTCTCTCTCTTCGGTCAGTTTCTCTTCTTCTCCTCCTCATACTCATGCTTCTCTTTT
+ACTCTAATGGAAAACATAGAATTGAGGTGCAGTATCACTGAGAACAGCCAATGCTGATAC
+TGTCATTTGTTATAGGATGTTTACTTAAGAAATGATTGTGGCCTTATTTGCCAAAGACGA
+TTAGGCCCTGAGCCATTTGTACAGCCAATGTGACACCTCCGTAACCATAAGAAAAATTAT
+GCTTCCACAAACAGAAAGAGAGACAAATACAGACAGTGAAAGCAAAACTATGAGAGAAGG
+GATAGCCATCTCAGCATTCAGCCAGTGTGTCACATGTCCAGAGGGCTGCAATATGAAGCC
+AATAAACTGAGAGAAAGGTGTGATTCCAGAGGGCTTTCCGGACTTTAAACTTTTCTCATT
+TTCACCTTCAGCTCGTTGTGAAGCCTTCAATTGTTCCTTGGTCACATGAAGCCCCCTGTG
+TGTAAAATTGACATTCAGCTTATTACTCTCATCTACATCTCTAAAGTTGCACATGACTGC
+CAGTAGAGGGTGCTCATGATTTGAGACAAGTAACTTTTCTGTGCTTGTGTCAACAGTTAA
+AAATTCCCTATGGATACTTGAAAGAAATGCACCAGTGTTTAAATTTAGACTCAGTCCAAG
+TAGGCTTTGCCATTTGCTTTACTGTTGTAATCAAATCAGTGCTCACAGTACATCAGTGGC
+AAAAGCAATTAGCTTAATTGAGTTAGTAGGGAGTGAAAAGATAGATCACTATTTCCTGGC
+AGCGATATATTTTTCTCAGTTAACCTTCTCACAGAAAATTAGTTAGATGAGTTTCTTATC
+TCATTAGAACCATTGTTGTTTATTATTTAAACCTGACCTTTATCCAGAGAATGTTTTTCA
+CAGTAAGCATGTGTTTCACTCCAGCTCATACAGACACACCTTGTGGCCAGTCAGGGAATG
+TGCATTAAAACTAATGTTCTCTCTGGTAGAGCCATTCTGCCTATTCTGTTATTCACCAAA
+ACTTTCCTGCCCAGATTTTTCCATCTAGTCAGGGGACTTTTTCCTCAGCTGAACTGTCAG
+TAGCCAGCTGCTCTGACCTTTACTCACCTCAGAGATTACTCATTCAAGTTATTTTACCAA
+TGATGGAATAAAGTGAATACACACATCGTGACTTCATCATACTTTCCCTCCTTTACCGTA
+CTTTCCTAACATCAGTTAGCAAATTATACACTTAAATATGCTAAAATAGAGATTTGTTTC
+AAATTGAAGAGCAACACAGGACACATTTGCTTACACAAGTGACTCTATCTTATTTTTTAA
+GTGGCTGTCATCCTCAATATCATCAATATTTTAGGCATGTGAATGTAGGTAATGAGTATT
+ACTAATTAATAATTGGATGAGTTTATGAATTCATCATTAAATAAGATTATTATGATAAAG
+CTACACATTATACTGCAATTCCGGGCCAACACTATTGTTTCGCCCTTACAGTACAGGACT
+GTACATATCACTGTCACTACAAATTGTTTCAGTGAGGCTCAGATTACAGCTCATCTTGCT
+TAGTCATTACGGCTCAGACCACCAGACAATGTCTTTACGTCAGAGAAAGTCTGAGTGAGA
+GCTGTCCTTAAAACCAAGTCCCATGAGGCAAGTAAAGAGGTGACTCGCTGAGAGGATCAG
+GGAGAGGGACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAAGAC
+AGAGAGGGTGCTGCATTGAGTCGAGAGGTGTGAGGATGTTCGATAAGCCATTATCACTCT
+GCTCGGAGGACGTCAGGCCCTATCCTTTTTTCTTTGAGTCACCACTTTCTCACCACAGCC
+ATCCTTCTTCCTTTGTCTGTTTAATCTTTTGCAGCCAAACATTTGGTATGCAAACTATAG
+GAAGATATGGTCTGACACCGACTGATGTGATGCTAATGCCTTCTCTGTTTTATCCAATGA
+CTCCTCATTTATCAGGACCAATCCAGCTATTGTGTGCTATTGGCCCAACACAGCATTAAA
+CATGGTGACCAGAATAGCCACAGCAAAATAAATAACGGGCCTCTGTGACTATTGTATGTG
+CATTTCTTACAGCTGTCATTTTTCTTTTCTGTTAGCTTTCATTCTACTGTGCGTGCTCTC
+TATCTGCCTACGTTGTATCTGTGCCTTTTGTTAAATTCATTCAGCCTTTTATCTGTCTTG
+AATTTCTTTCTCTGTGTCCTCCTTTCCCTCTCTGTCTCAGCAGATCCGTCCCTTGTTTTT
+GCAGGAGAAGCGCTCTGCGTCATGCAAGGTCCATCTTCTGCGACGCACCATCAGCGTTCC
+AGTGGAAACACAGTTTCCAGAACTCCATAGCCAGCTGTCCACTGAGAGCGGTGAGTAGCC
+TGAGGACATGCCTCTGCTGTGATTAGCATGCATCATTATTTCCATACACACACTGGAAAT
+CTTTTAATCGTTTTTCTTGACACAATTTAATTAATTTAAATAATTAATAACATTGAAATC
+AACTGTTAAACACTTGTTCAACATGGTTGTGGACAAAATCATCATAATGACTGTGGAGAC
+TAAGGAGAAACAATGCTTTGTTAAAATCTTTGCTCTGGTTTTGGCTTTTTCTATATTCTA
+TTTGTGTGTGCAGTGCTGCTAAACATCATCTTAGTCAGAGTCAAACTTGAGCACTCATGC
+AGATGCTTGTTCTATTCAGTGGTCAAATGGGCAGTGTAGCTTAGGAGAAGCACTTCTTTC
+CGCTCCTCAGTGACATAACCAGTCACACACTCACACAGGCAAGTGAGCCTTTTAAAATTG
+CTGATACTATTTTTTTCTACTTCATATCCACTAGATGGAGAGCTTGGTGCTTTGTAGCAC
+TCCAGTGTACTTGGAATGTTTCATCATAACCACTAAGGCAGACATTGATAAAGGCTTCGG
+TCTCTTTCAAACTGCAGGTGTCATGTTGCACTCTCCCTATTGCTTTTATGAAAATGTAGT
+GCCGGTAATATAACACAGTTACTCTCTGCATATATCACTATGTACACTTACTTCTATGGA
+AAAGATGGAGCGCCACAGTGAAAACTGTTTTGAGTCTGTGAGGGGAAAACACAGCATCAG
+TCACAGTGAAACACTAGGTGGCACTCAGGTTTGACATTCAAGCATTTGTATCCCACAGTT
+ACTGTTGCTGGGTTGTTGGCTGGCATGCAACTTAATATGATCTATCTTTAAATCAGTGTG
+TGCAGTGGTTATTTAGTTTAAGTGCTTTTTAATGATGTCACAACATTATTTTGTCTACAC
+CCTGCATACAGCACAGTATATTAAATTTAGGTTTTATTAAGTTAAGTAATGTTCTGAGGT
+GGCATTGCCCTCAGGTATATATCCCTCAGGCAGTGTTACTGGACAGCATATAGATTGTAA
+TGTTGTGTAAGCAGTGTTGTGTAAGCTTTTTTAACCAAAATGCTCTCATGTTTCTTTGTT
+ACCACAGTGGTTTTAGTGATGTTTTGTGCTGTGAACAGAATCATGATTTCTGCAGACACT
+CCACATCTGTTTAAACAGTGATTTTCACATCTGTCTGTAACTGAGTCAGTCAGTTTGTGG
+TTGGATTGATGTGTAGTGGGATCTACAGATCATCAACCCTCGGGGAAGCCATTTAGTTCT
+GTGTTAAATAAAAATACAACTTTTGAGCACTGTTTTTTCATATTTTTCTTCATCCCTTAG
+TTGATATTAAAGGTGCTATATGTAGATTTTTGCTATCACTACATAGCCAATGTTAGGATT
+AAGAACCCCAGCAACCCGAATGTTAACTCGTACTTTGCTTCTATTTCTATTACATATTTT
+CTTCTATGGAAGTTAGGATGTTAACCAGCTAACCCCAGGTCATCTCATAATACCACTTGG
+CAATAGTCAGTCACTGTTGCATTCAGTCTGCCCCTCCAGCATGAAAGGATGAAGAAGTAC
+CGCTACCCAGAAGGCGTAGTCTAACCCCTTGTCTTGTAAACACAGCAATGGCTGAAGCTC
+TTGGTAAGTAAACAGCTGTTAATGTCAGTGTTGGCTACATAGCTAAAACTTACACATAGC
+ACCGTTAAAAAAATAAATGGTAAGTTTTTGTCCTTTTAGTTAAAGCATGTAAATGTCAGT
+TAAAACAATTTAGAAAATTTCTCATTCAAATAGTCATTTTATTTTGTGTGCTATAAATAC
+CTTCAGTTTTTTTTCTTGTACTTTATTTTAAACTCTTGTCTTTCTCTTATGCCCCTTATC
+TACCAGGAGAGGTCACACTCTTGTTGATAGCATGATAAGGAAATGAGCAGAGATGTCCTT
+ATTTCTCCTCAAAGTTATTCCCTGCATAGCACATATTTGACTTTAAAAATACAAAGACTA
+CAGGTGCTAAATCACACACACAACACCCAAAAGAATAGAGGACTTTTAAATATGTGCATC
+CCATTTTCTAATCTATATTCACCACTGATACAAGTGATGACACGGTGATGAGAAAATAAC
+GTAACATACATTATTATACAAGATTGGTATGATTGCTGTAGGTTGGTTTTGTTTATCTGA
+GAAGGGACAGAGGCTAAAAGAATAAACAAAGTCTGCCAGCTACTTCACTAATTACAGAGT
+ACCCCTGCAACTCTGCCAATGACATTCTGAAACTTTTCCATGACTATTATGTAAGATAAT
+TTTTGAATCACTGATTCAGATTTCCATAGCCAAGATACACTATTCTGCATGTTGGCTAGA
+ATACATTACAATACATTAATATATTACTGTAGTGGTTATTATGTCAGCCATTTAAACATA
+ATTTCATACTTTCAGCTGTTCGCAGGGCAAACTTTTTATTTTTGTCACCTGAATCCAGTT
+GCATTTGGATTTGAATTCAGTGGTGACTGCCAATGAAAAATAACTCACAGGGGCACTTAG
+AGATCTGAGGCGGCATTGACTGAACATCGAAGGGCTACTATTACAGAAATGCAAGTGGAA
+AAAGAATCTGATATGATACTTGCCAGTATGAAAAGCATAATTAGGACTTTAAATGCATGT
+TTTAAATGTTTTTGTGAACCATAATTTCAGTGTAAAAGTTCCAGTTATATTTTAAAAGGA
+ACTCCAAATATCCAGTGGTAGCATCAAGGTAACCTGAGATAAGTGAAAAGTAATTCTAAA
+TTAATCAGTATGTTGAAATATCAGACATTTGTGTGCATTATTGTTAGTGTGACCATGGTG
+GGATACTTCAAACACACTTGTTCATTGGCAAAATAATTGTCACATGAATTAACACAAGTG
+ACACTTTCAGTATCATACTGACAGAATGTTTGTTGTTAACTTTATCCCTGAAAACAAACA
+CTAATACATGTTCTTGTCGCCCCTTCAGTGCCTAACCTTTAAAATTGTGCTTGTGAGTGT
+GTGTATGTGAGCGCACCTGTATGGTTTTCAAATAATGTTCCACATCACAACACTACAAAC
+ACTCACATGGTCTATGTTTTACTAAATTATTCATTGGCGTAGGCCCCACCTGCTCTTGTC
+CTTGTGTGACACAGGCTCTAAATAAGCAGCATGATGAATAAAAATGACACTGAGATGAAT
+AGGAATCCACAGCAAATCAGAGAGCACTCTCATCTCGTCTCATCCTCCGACTGAATAGCG
+AGCGGCTGCCTCCTTTATTCTTTTGAACTCTTCGCGGTTTTGGCACAAACATGCCAGAGA
+CAGAGAGCGCTGTTACGCTCCCACCAGAGCAACTACGCTTAATTTTACTGAGGTGAAAGT
+TTTTTTTTTTTTTCTGGATAAAGCTTTGGAAAAGTTCTCAACTGTTGCTTCTTTAAAGAT
+GCTGGGGCATATTCTGCCCTATTTTCCAGTTTTTTACATCTCCCATAAATATTTTCACAA
+GCTGTAACATTTTAGACAGGATTAAATTGAACTAGATAACTGACCAAAGGCTGCTAAATT
+ATTTTTATGTGCCTTGTAGCACAAATACTGTCTCACATATATTTTAAGTATCTTAATATT
+CCCTCTGATGTTTAATTTAACAAAGCTGTCCTTCCCTCCATCTCTCTCCTCATAGTTTTT
+CATTACAATTAGCTCTCATTAGATAGAATTGTATTTGTTGTCTTTGTGCCAGTCACTCCA
+GTCTATTTTGCCAGCACACAACTAAATAATTGTTTTGCCTTGTCAGTGTCTTGTTTTACA
+GTTTTAATGATGAGCCCAAAACATGTCAAATATGAGGAACTATAACTTATCAAGAAAGTG
+GGGTAGTTGAGATAAAACTGTTTCCGAGGTGGAGGTTGGCTGAGCTCCATTTGGCCACAA
+AATGTAGCTGAAAGGGCAGAGAAACCCACTTTAATGGAGTACAGGTTGCATATGAGCTGG
+TAGGAAAGATATAGAATCATTATCAGCTGATAATCTAACAGTAGCAGTCAGTGTAGATGC
+TGTGCTAACGCAAAGTTGTGAAACTACTGTCTGTAAGCAACTCATCCAATTGTTATTGCT
+GCCAAGCTTAAGTATTTTAACAGCTTTTAGGTGTTGTTAGCACAGTACTCGTTTGGATCC
+GGCCATGACAAGAAATCTTTATCGGCCACTAATTTAATTAATCATCTTTTTTCAAGCAAA
+AATCACAAACTTTCTTTGGTTCCACTTTTTCTCATTGTAGATTAAATATCTTTTGGGTTT
+TGGCACAGGCTGGACAAAAAAACCTCTGAGACGCTGTGATAAGAATTTATTTTCACATTT
+TTTTTACTTTTCAGGGACTACACAATTATTTGGTGATGAAAATAATATTTTGTTGCAGCC
+CAAATGTTAACTTGCCACTCAAGCTGTCAATTCAAGAAGGCAAAAGCAACAAATACTGCT
+TTGCCGAGCTGAAATGAGAGTAGAAACCATGCCCGGGCCAGCTCAGCCTGGTCAGGTTTT
+TGAGTCCATCTATTGTTAACATTCAGGTTGCAGCACAAGGGAAGTTCCTAAATTCTTCTG
+GCATGTTAATGTTTTCCAAACTGATGTTACCAAGTCCTCGTTATGATGAGAAAAAAATAT
+GCTGAGAGTGAAATTGATCAAAGTGGAAACATTAAGCACTGCCACAGTCCCCTCCACCCA
+TCTTTCTCCCTCTCTCTCCACCGCAACGTGGAAACTGCTCCTCTCTCTCTCTCCCTCTCC
+CTCTCCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCCTCCCTCCCA
+TTCTGTGCTCCGGTATACTCGCTCTCTCACTCTCTCCCTCTCTCCCCACTCTCCAGAGAG
+GGGTTCAGTCAGACAGATGTAACACAGCAGTAGAAGCCTGAGCTGAGCTGGCAGGCTGCG
+GAGGCCAGACCAGAGCCAGCAGCTCTGACTGGAGAGAACAGCGAAGAGGTGACGGCAGCA
+GCGGCAGCACAGGGGATAAAACAGTAGTTGTAGTAGCAGTTTCAGTAGTTGTACTTCAGT
+TACAGAGCTGACTTTACCTCAGGATATGGGTGTGTTGATCTGGGCGCTCATCACCCTGTG
+AATTTAACATGGACCCTGACACCAGCACCCATCCAGAGACACAACATGGTGAGTGAGATT
+TGAAGGAGGAAAAGATTAGAAACAATGAGAGTGATACTGTGGGAAAAGTTGAGGAGCGTG
+TTAGTGAACAAGGGAGTCAGGTCACATGGTTTTCCCGTTAGGGTTGCTATTATGACTAGG
+CTCTCCATTTGGCTCTAAAGCTGTTGACTAGGGCCTCTGTGGTCAAATGAATAGGACTTC
+AGTCTGTTCTGTTGAGTAGGGGGTGAAGGGGTGAGGGGTGTTACATGGCAATGTGATGAA
+ATCAACTGCCTGCTTAAGACATTTTGCTCTAATGACCCTCTTGTCATTACTTTAACAGGG
+TTGTAAAGTTTTTTTTGCTTTTTTGTAGCTAAGAAAGTTGAGAATTGTTTTGTCTGAACT
+CTCTCTGGGATTTGTCTTGTCGGTTTTTGGCTGGTTTTTGGTGTGAGCTTCACAGAGCAG
+GAAGCTCTCCTCCTGCTCTTTGAATGGAATAATTAACTGTGAGGGCCGTGGGTGTACCAT
+TTCTGCTCAAAAGCAGCAAGATAATTTGATGGTTATGTGAATCTGTATATTTGTATGCTG
+TGTAGTGGTGCTGCATGTGGGTGTTTGTGTTAGAGACACAGAGGGGCACCAAAGAATGAA
+AGTGGGAGACAGAGGGAACGAGAAGGGGAGAGACCGAGAGAGAAGGACTTATGTACACAA
+ATAAATCCAGGGGGATCTAGACTGCACTGTAGGCCAGTGCGAATGCTCACTCTTTCTCTT
+CCCCCTCATTTTCCGCTGCCTCTTTTTTTTCCTCCACTGCTCCAAATGTTGGAGCCCAAA
+CTAGATAGTTAAAAGGCAGAAAAAAATGGTGTGTTATTAACTGGGCCAGAAAAGACGATG
+TTTTGTCTTCATGGCCGATGGGAAGGACTCTGCTGTGCTGCTGATGAAGAATGTGGTTAA
+CAGAATGAGTCAACAGAGAACATATTTCCAAGAGACTGTAGTTTCTCTTCGCCAGCGTCT
+AAGCCACATTGCTTTATGCACTGGGCTCTCTGCCATGACGGCGAAGGAGAGACAAAGAGA
+GGGGAAAGAGAATCGCTAAAGATAAAACTCTGTTTTTATCCATCTCCTGAGACACAAAAC
+TTCTGTTAGCAATCTAACCAAATAAGCGAGAACATTAAGCTTCTTCTCACCTTCCCAAAA
+TAAAATGTCAACTTCATGCAGTAATACTCACTCTCTTCTCTCAACCAGTCAGCCAGCCTC
+TTTCAGTGCATACAGCTTGAGGAGATCCCTTCTAAAGGTCCAATATAAATAGAAAAGTGG
+GAGTAGAAAGGGCAATAATCTGATATCATCTGATTACATTCACACCTCAGGCTTGCACGC
+TACAGGAAGAGTTCACGCTTCCCAAGGCTTGCAGGCATCACTTTTCACTCATTCTCAGAT
+AGACACACAAACACATGCACAGAAATATCATTGCTGTTGTTTGCAACAAATCCTGGAGTA
+GACTACTTTGCATTGAATTTCTATATGCATGTGTTTTCATATATTACACATTGCTTTTTG
+TACTTTGCATATAAAGTAGATGCTGATCTGCTATCTGCATATATAGTAGCTGCAGATAGC
+ACTGTAACTACATCTACATATTTCTTGTTTGTATCTACATCAAGCAGATAGTTGCTGATG
+CTGGACAACCTCTTCCGATATTCATTATTTTGGAAAAAAAAATATCAATGGCATTCCTAC
+CTTACAACTTAAATTAAAAGTGGTCACTTGAGTAACTGCAGAACATGTGTTCACCCAATA
+GTTTTTTTTAGAGAGTGTCACTCAAAGTATTCCTCCTTACAAGCACCCATGCCTAAATCA
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.align
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.align Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,104 @@
+18 0.00 0.00 0.00 scaffold_1 613 632 (13519) (GT)n#Simple_repeat 1 20 (0) m_b1s252i0 1
+
+ scaffold_1 613 GTGTGTGTGTGTGTGTGTGT 632
+
+ (GT)n#Simple_ 1 GTGTGTGTGTGTGTGTGTGT 20
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (0/0)
+Gap_init rate = 0.00 (0 / 19), avg. gap size = 0.0 (0 / 0)
+
+
+16 18.30 2.22 2.22 scaffold_1 780 824 (13327) (ATAATA)n#Simple_repeat 1 45 (0) m_b1s252i1 2
+
+ scaffold_1 780 ATATTAAT-ATACTAAATAATGATAATATTAATTCTAATAATGATA 824
+ v - v - i v vv i
+ (ATAATA)n#Sim 1 ATAATAATAATAAT-AATAATAATAATAATAATAATAATAATAATA 45
+
+Matrix = Unknown
+Transitions / transversions = 0.40 (2/5)
+Gap_init rate = 0.05 (2 / 44), avg. gap size = 1.00 (2 / 2)
+
+
+12 23.88 4.55 0.00 scaffold_1 2231 2274 (11877) (CAGA)n#Simple_repeat 1 46 (0) m_b1s252i2 3
+
+ scaffold_1 2231 CAGA-AAACAGTCAGCCAATCAGA-GGACAGACTCAGAGACAGACA 2274
+ - i v v iv -i vv v
+ (CAGA)n#Simpl 1 CAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACA 46
+
+Matrix = Unknown
+Transitions / transversions = 0.50 (3/6)
+Gap_init rate = 0.05 (2 / 43), avg. gap size = 1.00 (2 / 2)
+
+
+15 18.42 10.20 0.00 scaffold_1 4853 4901 (9250) (TC)n#Simple_repeat 1 54 (0) m_b1s252i3 4
+
+ scaffold_1 4853 TCTATTTTTCTCTCTCTCTCT-TCGGTCAGTTTCTCT-TCT-TCTC-CTC 4898
+ v i i - vv vv i - - -
+ (TC)n#Simple_ 1 TCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 50
+
+ scaffold_1 4899 -CTC 4901
+ -
+ (TC)n#Simple_ 51 TCTC 54
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.10 (5 / 48), avg. gap size = 1.00 (5 / 5)
+
+
+13 19.07 1.82 7.69 scaffold_1 6230 6284 (7867) (TAATTAA)n#Simple_repeat 1 52 (0) m_b1s252i4 5
+
+ scaffold_1 6230 TAATGAGT-ATTACTAATTAATAATTGGATGAGTTTATGAATTCATCATT 6278
+ v i - v -i - i v - v v
+ (TAATTAA)n#Si 1 TAATTAATAATTAATAATTAATAATT-AAT-AATTAAT-AATTAATAATT 47
+
+ scaffold_1 6279 AAATAA 6284
+ -
+ (TAATTAA)n#Si 48 -AATAA 52
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.09 (5 / 54), avg. gap size = 1.00 (5 / 5)
+
+
+15 28.31 0.00 3.51 scaffold_1 6548 6606 (7545) (GACA)n#Simple_repeat 1 57 (0) m_b1s252i5 6
+
+ scaffold_1 6548 GACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAA 6597
+ v i i viv i vi v -v i -
+ (GACA)n#Simpl 1 GACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGA-CAGAC-A 48
+
+ scaffold_1 6598 GACAGAGAG 6606
+ v
+ (GACA)n#Simpl 49 GACAGACAG 57
+
+Matrix = Unknown
+Transitions / transversions = 0.86 (6/7)
+Gap_init rate = 0.03 (2 / 58), avg. gap size = 1.00 (2 / 2)
+
+
+67 2.94 1.43 0.00 scaffold_1 11981 12050 (2170) (CT)n#Simple_repeat 1 71 (0) c_b1s251i0 7
+
+ scaffold_1 11981 CTCTCTCTCTCTCCCTCTCCCTCTC-CTCTCTCTCTCTCTCTCTCTCTCT 12029
+ i i -
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCT 50
+
+ scaffold_1 12030 CTCTCTCTCTCTCTCTCTCTC 12050
+
+ (CT)n#Simple_ 51 CTCTCTCTCTCTCTCTCTCTC 71
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (2/0)
+Gap_init rate = 0.01 (1 / 69), avg. gap size = 1.00 (1 / 1)
+
+
+19 15.37 2.78 0.00 scaffold_1 12078 12113 (2107) (CT)n#Simple_repeat 1 37 (0) m_b1s252i6 8
+
+ scaffold_1 12078 CTCGCTCTCTCACTCTCTCCCTCTCTC-CCCACTCTC 12113
+ v v i - i v
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 37
+
+Matrix = Unknown
+Transitions / transversions = 0.67 (2/3)
+Gap_init rate = 0.03 (1 / 35), avg. gap size = 1.00 (1 / 1)
+
+
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.cat
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.cat Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,103 @@
+18 0.00 0.00 0.00 scaffold_1 613 632 (13519) (GT)n#Simple_repeat 1 20 (0) m_b1s252i0
+
+ scaffold_1 613 GTGTGTGTGTGTGTGTGTGT 632
+
+ (GT)n#Simple_ 1 GTGTGTGTGTGTGTGTGTGT 20
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (0/0)
+Gap_init rate = 0.00 (0 / 19), avg. gap size = 0.0 (0 / 0)
+
+16 18.30 2.22 2.22 scaffold_1 780 824 (13327) (ATAATA)n#Simple_repeat 1 45 (0) m_b1s252i1
+
+ scaffold_1 780 ATATTAAT-ATACTAAATAATGATAATATTAATTCTAATAATGATA 824
+ v - v - i v vv i
+ (ATAATA)n#Sim 1 ATAATAATAATAAT-AATAATAATAATAATAATAATAATAATAATA 45
+
+Matrix = Unknown
+Transitions / transversions = 0.40 (2/5)
+Gap_init rate = 0.05 (2 / 44), avg. gap size = 1.00 (2 / 2)
+
+12 23.88 4.55 0.00 scaffold_1 2231 2274 (11877) (CAGA)n#Simple_repeat 1 46 (0) m_b1s252i2
+
+ scaffold_1 2231 CAGA-AAACAGTCAGCCAATCAGA-GGACAGACTCAGAGACAGACA 2274
+ - i v v iv -i vv v
+ (CAGA)n#Simpl 1 CAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGACA 46
+
+Matrix = Unknown
+Transitions / transversions = 0.50 (3/6)
+Gap_init rate = 0.05 (2 / 43), avg. gap size = 1.00 (2 / 2)
+
+15 18.42 10.20 0.00 scaffold_1 4853 4901 (9250) (TC)n#Simple_repeat 1 54 (0) m_b1s252i3
+
+ scaffold_1 4853 TCTATTTTTCTCTCTCTCTCT-TCGGTCAGTTTCTCT-TCT-TCTC-CTC 4898
+ v i i - vv vv i - - -
+ (TC)n#Simple_ 1 TCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 50
+
+ scaffold_1 4899 -CTC 4901
+ -
+ (TC)n#Simple_ 51 TCTC 54
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.10 (5 / 48), avg. gap size = 1.00 (5 / 5)
+
+13 19.07 1.82 7.69 scaffold_1 6230 6284 (7867) (TAATTAA)n#Simple_repeat 1 52 (0) m_b1s252i4
+
+ scaffold_1 6230 TAATGAGT-ATTACTAATTAATAATTGGATGAGTTTATGAATTCATCATT 6278
+ v i - v -i - i v - v v
+ (TAATTAA)n#Si 1 TAATTAATAATTAATAATTAATAATT-AAT-AATTAAT-AATTAATAATT 47
+
+ scaffold_1 6279 AAATAA 6284
+ -
+ (TAATTAA)n#Si 48 -AATAA 52
+
+Matrix = Unknown
+Transitions / transversions = 0.60 (3/5)
+Gap_init rate = 0.09 (5 / 54), avg. gap size = 1.00 (5 / 5)
+
+15 28.31 0.00 3.51 scaffold_1 6548 6606 (7545) (GACA)n#Simple_repeat 1 57 (0) m_b1s252i5
+
+ scaffold_1 6548 GACAGAGAGATAAACAGACAGACATGGAAACAGAGGGACATAGAAAACAA 6597
+ v i i viv i vi v -v i -
+ (GACA)n#Simpl 1 GACAGACAGACAGACAGACAGACAGACAGACAGACAGACAGA-CAGAC-A 48
+
+ scaffold_1 6598 GACAGAGAG 6606
+ v
+ (GACA)n#Simpl 49 GACAGACAG 57
+
+Matrix = Unknown
+Transitions / transversions = 0.86 (6/7)
+Gap_init rate = 0.03 (2 / 58), avg. gap size = 1.00 (2 / 2)
+
+67 2.94 1.43 0.00 scaffold_1 11981 12050 (2170) (CT)n#Simple_repeat 1 71 (0) c_b1s251i0
+
+ scaffold_1 11981 CTCTCTCTCTCTCCCTCTCCCTCTC-CTCTCTCTCTCTCTCTCTCTCTCT 12029
+ i i -
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCT 50
+
+ scaffold_1 12030 CTCTCTCTCTCTCTCTCTCTC 12050
+
+ (CT)n#Simple_ 51 CTCTCTCTCTCTCTCTCTCTC 71
+
+Matrix = Unknown
+Transitions / transversions = 1.00 (2/0)
+Gap_init rate = 0.01 (1 / 69), avg. gap size = 1.00 (1 / 1)
+
+19 15.37 2.78 0.00 scaffold_1 12078 12113 (2107) (CT)n#Simple_repeat 1 37 (0) m_b1s252i6
+
+ scaffold_1 12078 CTCGCTCTCTCACTCTCTCCCTCTCTC-CCCACTCTC 12113
+ v v i - i v
+ (CT)n#Simple_ 1 CTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTCTC 37
+
+Matrix = Unknown
+Transitions / transversions = 0.67 (2/3)
+Gap_init rate = 0.03 (1 / 35), avg. gap size = 1.00 (1 / 1)
+
+## Total Sequences: 1
+## Total Length: 14220
+## Total NonMask ( excluding >20bp runs of N/X bases ): 14220
+## Total NonSub ( excluding all non ACGT bases ):14220
+RepeatMasker version open-4.0.7 , default mode
+run with rmblastn version 2.2.27+
+RepeatMasker Combined Database: Dfam_Consensus-20170127
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.gff Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,11 @@
+##gff-version 2
+##date 2018-04-21
+##sequence-region dataset_12.dat
+scaffold_1 RepeatMasker similarity 613 632 0.0 + . Target "Motif:(GT)n" 1 20
+scaffold_1 RepeatMasker similarity 780 824 18.3 + . Target "Motif:(ATAATA)n" 1 45
+scaffold_1 RepeatMasker similarity 2231 2274 23.9 + . Target "Motif:(CAGA)n" 1 46
+scaffold_1 RepeatMasker similarity 4853 4901 18.4 + . Target "Motif:(TC)n" 1 54
+scaffold_1 RepeatMasker similarity 6230 6284 19.1 + . Target "Motif:(TAATTAA)n" 1 52
+scaffold_1 RepeatMasker similarity 6548 6606 28.3 + . Target "Motif:(GACA)n" 1 57
+scaffold_1 RepeatMasker similarity 11981 12050 2.9 + . Target "Motif:(CT)n" 1 71
+scaffold_1 RepeatMasker similarity 12078 12113 15.4 + . Target "Motif:(CT)n" 1 37
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.log
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.log Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,10 @@
+SW score % div. % del. % ins. query sequence pos in query: begin end (left) repeat class/family pos in repeat: begin end (left) ID
+
+18 0.0 0.0 0.0 scaffold_1 613 632 (13588) (GT)n Simple_repeat 1 20 (0) 1
+16 18.3 2.2 2.2 scaffold_1 780 824 (13396) (ATAATA)n Simple_repeat 1 45 (0) 2
+12 23.9 4.5 0.0 scaffold_1 2231 2274 (11946) (CAGA)n Simple_repeat 1 46 (0) 3
+15 18.4 10.2 0.0 scaffold_1 4853 4901 (9319) (TC)n Simple_repeat 1 54 (0) 4
+13 19.1 1.8 7.7 scaffold_1 6230 6284 (7936) (TAATTAA)n Simple_repeat 1 52 (0) 5
+15 28.3 0.0 3.5 scaffold_1 6548 6606 (7614) (GACA)n Simple_repeat 1 57 (0) 6
+67 2.9 1.4 0.0 scaffold_1 11981 12050 (2170) (CT)n Simple_repeat 1 71 (0) 7
+19 15.4 2.8 0.0 scaffold_1 12078 12113 (2107) (CT)n Simple_repeat 1 37 (0) 8
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.masked
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.masked Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,286 @@
+>scaffold_1
+TGCTTTTCTGAGATTTATGTCAGCTCCCCATTGGGAGATACAGGAGAATC
+CAATATATTCCTGTCTCGCTTCTTTTATATTTATCCTTTCTACACCTGAC
+ATCCTCAGTGATTGAAGTGACAAAAAGTGGAGCGCACGCAGTGGTCATTA
+CCCTCCAATGGTACTTCTAATTAAGGAAAGATTTTTTGCATTCACTGAGC
+AAAACACTTATTTGCATGAATGGAAAATCATAAATGAGGGGTCCATTAAA
+CAAATTTCCTAATTGTTTGCTTTTTTTTCTTCCTACTTCACCATCCCTCT
+AAAGCTATTACTCTCTATTCTACCCCATTATCGAGTGCACAAACACCAGC
+CCCAAATTGTCTTATCTCTGCTTTGATAAATGATATTTTTTTCTCTTATA
+ATTGTGTTTCTCTCTAGATGTGCGGTGTCCATCAAGACACTGGATGTCAC
+GTGGTCACTCCTGTGAAGAGCGAACTGTGTGGAACCCGAAGTACTGTGTG
+GTTGCTGACTGTCAGATGCTGCTTCTGAATGAGGAGGAGGTGGTGAGAGC
+AGACAGCACAATCTCTTGTCTGGCATGTTCCTCTGTGTCACCATTGTCTC
+TCTCATCTGCTCNNNNNNNNNNNNNNNNNNNNCCTTGTCAATGTCATTAC
+ACAATTTATGTTGGTGCACTGCATGTCAGAGTCTGAACTTTGTTGGACAT
+CTACTTTCTGTCACCTGATACCTCATACTTTACACTCTAATCCCTTTTTC
+CTTTCTAACTGCTGCTGTGTTAAGCTGTCNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNGTGAATGGAGATTCACAATGAAGAAA
+CACAAGGTCCAGACTGAACCCCTGTGCTGTGTGAAGAGTTCACTCTACAT
+TTACATTCATCCCACATCAGAGACCAGCAATAGCCAGGTTAAGCAGAGCA
+AGGCTGAGTCTGGCTCTTTGCCTCTGTTGTTTTGATTAGTGTCACACTGG
+ATTATGCTAGTTTGTGTGAGATTAGAGGTCCTGTTGTTACGAGCAAATCA
+GCAGTCAGCAGGGTAATCTAAATTACATTGTTCTGTCGGCAATATCCTCT
+CCTCGCTCAACAGCTTTGTGTGAGCTCATATTTAAAGCCCCCACAGTAGT
+GCAGTGCATAAAATCATGCAGATACAGATCAGAAGCTTCAGGTAATGTTT
+ACATCAAACATCAGGGGGAAAATGTGATCTCAGTGCCTCTGACCGTGGTG
+TGATTGTTGGTGCCGGACAGGCTGGTTTGAGTATTTCTAAAACTGCTGAT
+CTCCTGGGATTTTCACACACGGCATTCTCTAGAGTTTACTCAGAACGGTG
+TGGAAAGCAAAAAAACATCCCGCGAGCTGCAATCCTGCGGATGGAAACAC
+CTTGTTGATGGGATATGTCAGAGGAATGGCCAGGCTGGATCAATCTGACA
+GAAAGGCGGTAACTCAGATAAGCACTCTCTACAACTGTGGTGAGCAGAAA
+AGCGTTCTCAGAATGCACAACACGTTCAACCTTGAGGAAGATGTTGCTAC
+AGCAGCAGATGAAGACCACGTCTGGTTCCACTCCTGTCAGCCAAGAACAT
+CTCAGACTGCACAGGACACCAAAACAAAAACACATCCTGTTTTCTACTGG
+TGGTAGAGTCACAATTTGGCAATAAGATAAATCCATGGACCCAACTTGCC
+TTGTGTCAATAGACCAAGCTGCTGGTGGTCTTGGGGAATGTTTTCTTTAC
+ACTTTCACACTATCGGCCTATATAAAATCCTATTATAAACTGCTGTACAG
+TGCATTGGGTTTGATAAGCCCTCTAAGTCTGTATATCATGATCTCATTGA
+TACCTGCGGCAATACACCCCCACAAACGCAGCTCCCTGCATTTTAAGTAT
+TATAGAGAGTAATTTCACTGTCCATGTCTTTTTTGATCATAAAGCAGGTC
+TAGGTGCTGTATACAACACTGTATTGAAATGCTGAAGCAGGTCTAGGTGC
+TGTATACAACACTGTATTGAAATGCTGAAGCCAATATATCAATCTATCTG
+TCTATATTTTATGAAATATCAGAGCATTTTAGTCCAAATTTGTCTGTTTT
+GTTCATTGCAATGCTGACTGCTTAACATTTTCCTCAGTGGTGGCCATCAC
+CACAGCATTTACTGGTGAGTTTTACCAAGCTACAGTGGGCCACAATGAGT
+TACCTGTTATTGGCCTGGCTCTATGGCATGNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNCAAAGTGCCCTGTTCTTGTTAGAGCA
+GAGATAAATGAGACAGAGGAGATGTAAAACTATACTGAGATGGTTTTTTG
+GTTCTTAAAACCACAAATATATTGTATTACGGATATCAAAACTTCAAATA
+AAACCAGTAAAGTGTAAAACATGGGACCTCTAAATGAAGGGCTGTTTTGT
+TTCGTAGTTCTAGATTATGTCACTATGTGGCCTCGGTCTCTGTCTGCGTA
+AAGCGGCTACATGTAGAATTTGACCCACTTTGGTGCCCACATATGGTAAC
+TAAAACACTACAGACAGTATGCACTCCAACCCTATATAATTTATGTCCTT
+CAGTGAAGCCTACAAAATGTGCAGCATGATTTGCTATGATTAATACCTAG
+AATTATATTAAATTTTAGAAGTTTAGAGAGATGGCTTATACCTTTTTCTG
+AGCATGGAGTCATCTCATGTAATTTGTCACATACCTTTGGCCAGCTTAAA
+CCTGGTCATTCCAGTGAGAGCTGCTCACCCAAATGTTTCTGTATGCACCT
+CCTGCTGTGGGTGCCAATAGCTCATGCAAGTTGGTGTCTTTCAACTAAGG
+CCACTATGTGAGGACCATCAGCAGCAAATTAAATTAGAAGTGCCTTGGAG
+TTTCTCAGGCCCTCTTCTATGATCATTAAGGTCTCAGTGACAGAACAGTG
+CCCCTTTGAGGGACTATGGCATCTTGAGCACTTAAGTTGGCCGAATGTTT
+GATCTCAAATATGAGTGCACTGTTTCAAAGTCACAAAAGCCTCTGGACAA
+GGCATAGTTACTGGGCTTGGTTAACCTTTTTTTCATACCGGCGTGACTGC
+TGGAACTTGGAACATGTAGCCTAAGTTTCCCTTTGTCTGCAATTACTGAG
+GTATGCCATGTTGAAATAGAACAATAATTGCAGGGAGGAATTATTCCAAT
+CGACCCATCGGCAGGCTTTCCAATACAGTGCTTTTTGTTTCACAGCAACA
+AAGAACAAGAGCTTTTAAATGCATCCATCTGGACCCTGACTATGAAAGGT
+CATTGGTAACGCTGCTGGATTTCTGTTATGTCAGCAAACTGCAGGTCAAA
+GCGATGATACAGTCTTATAATGGCTTTCTCCAAGTGAAGGTGGGATAACA
+TGGTTTAAACAAGCTCAGTTAAATGGATCAGAGCATCAACTGCTGTGAAC
+AAGCAATCACACGGTCAAGGTCAAACATTTACACTTCTGAGAGATCTGGA
+GAGTATGTCATGGCAGTATTGCTTTTCAGTTATTTCAGTAACTGATTACG
+CCTTGTACTTAGTCTCAGAATTAGTGATTTGATTCAAAGTGTTTTATATA
+TGTATATTTCAAAGCAAAAATACAGCTTAGGTAAAGCTCCTTAGACTCAT
+GCAGCCTAATTTACTGTAGACATTCCTCCATGTACAGTACTGTGCAAATG
+TTTTAGGCAGTTTTAGGCACTAAAGGTGAACTGAGGATGCAGTCCCACGA
+TTAATTTTTATTCATCAGTTAACCTCATGTGAAGTGTAGTAAACAGAAAA
+AACCTAAATCAGATCAGTATTTCTTATGACCCCCCTCCCCTACCACCCAT
+CTTTAAAACAGCTCCAGTTCTCCTCAATCCCCCTGTACTTAGGTAGTTTT
+TTTCTAGCGTCTTGGAGAAGTTGCCTCAGTTCTTCTGTGGATTTTAGGCT
+GTCTCTGTGTCTTCTGTCTCCTCATGTATTCTCAGACTGACTCCATGATG
+TTGAGATCAGGGCTCTGTGGTGGGGGGGTCAGACCATCTGTTGCGGGACT
+CCTTGTTCTTCTTGTCTCTGAGGATAGTTCTTTATGATGCTGACTGTGTG
+ATTGGACTCATTGTCCTGCTGCAGAATTAATCTGGGACTGATCAGACATC
+TCCCTGATTGTACTGACAAAGGATAAGAGCAAAAACCTGTAGACTGCCTA
+AAACTTCTGCACAGTACTGCACAATACTGTATGTATGTGTGATAATACTC
+AGAAGTGATATAGAGTGGTTCAGGAGAAGCCTTAACTTACTTGTTCTTCT
+TTTCCCTATGATGCAATTTCTCTCCAAGCAAACAGTACATAATGAAATAT
+GTCTAAGAAAACACTAGCTGTTTGTCTTTTTGAAACACATTTAATAATTC
+AGATTTAGCCACAAATTAAAAATGAGCTTATACTTTGAACTTGCCCATTG
+GTTTTGATGTATGAAGCTGACAGATTTAGTCCACTGCATACTGCACTTTT
+TTGGATAGTGAAATAAATTAATTTATTATGCAGCATTTAAGCATATTGCT
+GTTATCTAGAATTTTATATATTAATAGGTATATATTATATTAACTCTTCA
+TTTGCTTAAATTTGGCCTGTATATTCCTCCATTTTATACAACCTTTAGAA
+AACACTGGAGTGAACAAAAATGTGAGGTTCAAAAGTGAGAGGAAAGAAAA
+ATCAGTGTGTGCAGCAAGACTGTAAGAGTCCCTGAACAAAAGTGTTGATT
+TATTGTTGGCTGTGAAAGTTTTTGCTGCAGGGGTTTTTGTAAACAGTGAC
+TCTTCTTTATGTCTTTGTTTCTATCTTTTTGTGTTTTCTTTTTTCATCTT
+ATNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NATACTCATGCTTCTCTTTTACTCTAATGGAAAACATAGAATTGAGGTGC
+AGTATCACTGAGAACAGCCAATGCTGATACTGTCATTTGTTATAGGATGT
+TTACTTAAGAAATGATTGTGGCCTTATTTGCCAAAGACGATTAGGCCCTG
+AGCCATTTGTACAGCCAATGTGACACCTCCGTAACCATAAGAAAAATTAT
+GCTTCCACAAACAGAAAGAGAGACAAATACAGACAGTGAAAGCAAAACTA
+TGAGAGAAGGGATAGCCATCTCAGCATTCAGCCAGTGTGTCACATGTCCA
+GAGGGCTGCAATATGAAGCCAATAAACTGAGAGAAAGGTGTGATTCCAGA
+GGGCTTTCCGGACTTTAAACTTTTCTCATTTTCACCTTCAGCTCGTTGTG
+AAGCCTTCAATTGTTCCTTGGTCACATGAAGCCCCCTGTGTGTAAAATTG
+ACATTCAGCTTATTACTCTCATCTACATCTCTAAAGTTGCACATGACTGC
+CAGTAGAGGGTGCTCATGATTTGAGACAAGTAACTTTTCTGTGCTTGTGT
+CAACAGTTAAAAATTCCCTATGGATACTTGAAAGAAATGCACCAGTGTTT
+AAATTTAGACTCAGTCCAAGTAGGCTTTGCCATTTGCTTTACTGTTGTAA
+TCAAATCAGTGCTCACAGTACATCAGTGGCAAAAGCAATTAGCTTAATTG
+AGTTAGTAGGGAGTGAAAAGATAGATCACTATTTCCTGGCAGCGATATAT
+TTTTCTCAGTTAACCTTCTCACAGAAAATTAGTTAGATGAGTTTCTTATC
+TCATTAGAACCATTGTTGTTTATTATTTAAACCTGACCTTTATCCAGAGA
+ATGTTTTTCACAGTAAGCATGTGTTTCACTCCAGCTCATACAGACACACC
+TTGTGGCCAGTCAGGGAATGTGCATTAAAACTAATGTTCTCTCTGGTAGA
+GCCATTCTGCCTATTCTGTTATTCACCAAAACTTTCCTGCCCAGATTTTT
+CCATCTAGTCAGGGGACTTTTTCCTCAGCTGAACTGTCAGTAGCCAGCTG
+CTCTGACCTTTACTCACCTCAGAGATTACTCATTCAAGTTATTTTACCAA
+TGATGGAATAAAGTGAATACACACATCGTGACTTCATCATACTTTCCCTC
+CTTTACCGTACTTTCCTAACATCAGTTAGCAAATTATACACTTAAATATG
+CTAAAATAGAGATTTGTTTCAAATTGAAGAGCAACACAGGACACATTTGC
+TTACACAAGTGACTCTATCTTATTTTTTAAGTGGCTGTCATCCTCAATAT
+CATCAATATTTTAGGCATGTGAATGTAGGNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNGATTATTATGATAAAG
+CTACACATTATACTGCAATTCCGGGCCAACACTATTGTTTCGCCCTTACA
+GTACAGGACTGTACATATCACTGTCACTACAAATTGTTTCAGTGAGGCTC
+AGATTACAGCTCATCTTGCTTAGTCATTACGGCTCAGACCACCAGACAAT
+GTCTTTACGTCAGAGAAAGTCTGAGTGAGAGCTGTCCTTAAAACCAAGTC
+CCATGAGGCAAGTAAAGAGGTGACTCGCTGAGAGGATCAGGGAGAGGNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNGGTGCTGCATTGAGTCGAGAGGTGTGAGGATGTTCGATAAGCCA
+TTATCACTCTGCTCGGAGGACGTCAGGCCCTATCCTTTTTTCTTTGAGTC
+ACCACTTTCTCACCACAGCCATCCTTCTTCCTTTGTCTGTTTAATCTTTT
+GCAGCCAAACATTTGGTATGCAAACTATAGGAAGATATGGTCTGACACCG
+ACTGATGTGATGCTAATGCCTTCTCTGTTTTATCCAATGACTCCTCATTT
+ATCAGGACCAATCCAGCTATTGTGTGCTATTGGCCCAACACAGCATTAAA
+CATGGTGACCAGAATAGCCACAGCAAAATAAATAACGGGCCTCTGTGACT
+ATTGTATGTGCATTTCTTACAGCTGTCATTTTTCTTTTCTGTTAGCTTTC
+ATTCTACTGTGCGTGCTCTCTATCTGCCTACGTTGTATCTGTGCCTTTTG
+TTAAATTCATTCAGCCTTTTATCTGTCTTGAATTTCTTTCTCTGTGTCCT
+CCTTTCCCTCTCTGTCTCAGCAGATCCGTCCCTTGTTTTTGCAGGAGAAG
+CGCTCTGCGTCATGCAAGGTCCATCTTCTGCGACGCACCATCAGCGTTCC
+AGTGGAAACACAGTTTCCAGAACTCCATAGCCAGCTGTCCACTGAGAGCG
+GTGAGTAGCCTGAGGACATGCCTCTGCTGTGATTAGCATGCATCATTATT
+TCCATACACACACTGGAAATCTTTTAATCGTTTTTCTTGACACAATTTAA
+TTAATTTAAATAATTAATAACATTGAAATCAACTGTTAAACACTTGTTCA
+ACATGGTTGTGGACAAAATCATCATAATGACTGTGGAGACTAAGGAGAAA
+CAATGCTTTGTTAAAATCTTTGCTCTGGTTTTGGCTTTTTCTATATTCTA
+TTTGTGTGTGCAGTGCTGCTAAACATCATCTTAGTCAGAGTCAAACTTGA
+GCACTCATGCAGATGCTTGTTCTATTCAGTGGTCAAATGGGCAGTGTAGC
+TTAGGAGAAGCACTTCTTTCCGCTCCTCAGTGACATAACCAGTCACACAC
+TCACACAGGCAAGTGAGCCTTTTAAAATTGCTGATACTATTTTTTTCTAC
+TTCATATCCACTAGATGGAGAGCTTGGTGCTTTGTAGCACTCCAGTGTAC
+TTGGAATGTTTCATCATAACCACTAAGGCAGACATTGATAAAGGCTTCGG
+TCTCTTTCAAACTGCAGGTGTCATGTTGCACTCTCCCTATTGCTTTTATG
+AAAATGTAGTGCCGGTAATATAACACAGTTACTCTCTGCATATATCACTA
+TGTACACTTACTTCTATGGAAAAGATGGAGCGCCACAGTGAAAACTGTTT
+TGAGTCTGTGAGGGGAAAACACAGCATCAGTCACAGTGAAACACTAGGTG
+GCACTCAGGTTTGACATTCAAGCATTTGTATCCCACAGTTACTGTTGCTG
+GGTTGTTGGCTGGCATGCAACTTAATATGATCTATCTTTAAATCAGTGTG
+TGCAGTGGTTATTTAGTTTAAGTGCTTTTTAATGATGTCACAACATTATT
+TTGTCTACACCCTGCATACAGCACAGTATATTAAATTTAGGTTTTATTAA
+GTTAAGTAATGTTCTGAGGTGGCATTGCCCTCAGGTATATATCCCTCAGG
+CAGTGTTACTGGACAGCATATAGATTGTAATGTTGTGTAAGCAGTGTTGT
+GTAAGCTTTTTTAACCAAAATGCTCTCATGTTTCTTTGTTACCACAGTGG
+TTTTAGTGATGTTTTGTGCTGTGAACAGAATCATGATTTCTGCAGACACT
+CCACATCTGTTTAAACAGTGATTTTCACATCTGTCTGTAACTGAGTCAGT
+CAGTTTGTGGTTGGATTGATGTGTAGTGGGATCTACAGATCATCAACCCT
+CGGGGAAGCCATTTAGTTCTGTGTTAAATAAAAATACAACTTTTGAGCAC
+TGTTTTTTCATATTTTTCTTCATCCCTTAGTTGATATTAAAGGTGCTATA
+TGTAGATTTTTGCTATCACTACATAGCCAATGTTAGGATTAAGAACCCCA
+GCAACCCGAATGTTAACTCGTACTTTGCTTCTATTTCTATTACATATTTT
+CTTCTATGGAAGTTAGGATGTTAACCAGCTAACCCCAGGTCATCTCATAA
+TACCACTTGGCAATAGTCAGTCACTGTTGCATTCAGTCTGCCCCTCCAGC
+ATGAAAGGATGAAGAAGTACCGCTACCCAGAAGGCGTAGTCTAACCCCTT
+GTCTTGTAAACACAGCAATGGCTGAAGCTCTTGGTAAGTAAACAGCTGTT
+AATGTCAGTGTTGGCTACATAGCTAAAACTTACACATAGCACCGTTAAAA
+AAATAAATGGTAAGTTTTTGTCCTTTTAGTTAAAGCATGTAAATGTCAGT
+TAAAACAATTTAGAAAATTTCTCATTCAAATAGTCATTTTATTTTGTGTG
+CTATAAATACCTTCAGTTTTTTTTCTTGTACTTTATTTTAAACTCTTGTC
+TTTCTCTTATGCCCCTTATCTACCAGGAGAGGTCACACTCTTGTTGATAG
+CATGATAAGGAAATGAGCAGAGATGTCCTTATTTCTCCTCAAAGTTATTC
+CCTGCATAGCACATATTTGACTTTAAAAATACAAAGACTACAGGTGCTAA
+ATCACACACACAACACCCAAAAGAATAGAGGACTTTTAAATATGTGCATC
+CCATTTTCTAATCTATATTCACCACTGATACAAGTGATGACACGGTGATG
+AGAAAATAACGTAACATACATTATTATACAAGATTGGTATGATTGCTGTA
+GGTTGGTTTTGTTTATCTGAGAAGGGACAGAGGCTAAAAGAATAAACAAA
+GTCTGCCAGCTACTTCACTAATTACAGAGTACCCCTGCAACTCTGCCAAT
+GACATTCTGAAACTTTTCCATGACTATTATGTAAGATAATTTTTGAATCA
+CTGATTCAGATTTCCATAGCCAAGATACACTATTCTGCATGTTGGCTAGA
+ATACATTACAATACATTAATATATTACTGTAGTGGTTATTATGTCAGCCA
+TTTAAACATAATTTCATACTTTCAGCTGTTCGCAGGGCAAACTTTTTATT
+TTTGTCACCTGAATCCAGTTGCATTTGGATTTGAATTCAGTGGTGACTGC
+CAATGAAAAATAACTCACAGGGGCACTTAGAGATCTGAGGCGGCATTGAC
+TGAACATCGAAGGGCTACTATTACAGAAATGCAAGTGGAAAAAGAATCTG
+ATATGATACTTGCCAGTATGAAAAGCATAATTAGGACTTTAAATGCATGT
+TTTAAATGTTTTTGTGAACCATAATTTCAGTGTAAAAGTTCCAGTTATAT
+TTTAAAAGGAACTCCAAATATCCAGTGGTAGCATCAAGGTAACCTGAGAT
+AAGTGAAAAGTAATTCTAAATTAATCAGTATGTTGAAATATCAGACATTT
+GTGTGCATTATTGTTAGTGTGACCATGGTGGGATACTTCAAACACACTTG
+TTCATTGGCAAAATAATTGTCACATGAATTAACACAAGTGACACTTTCAG
+TATCATACTGACAGAATGTTTGTTGTTAACTTTATCCCTGAAAACAAACA
+CTAATACATGTTCTTGTCGCCCCTTCAGTGCCTAACCTTTAAAATTGTGC
+TTGTGAGTGTGTGTATGTGAGCGCACCTGTATGGTTTTCAAATAATGTTC
+CACATCACAACACTACAAACACTCACATGGTCTATGTTTTACTAAATTAT
+TCATTGGCGTAGGCCCCACCTGCTCTTGTCCTTGTGTGACACAGGCTCTA
+AATAAGCAGCATGATGAATAAAAATGACACTGAGATGAATAGGAATCCAC
+AGCAAATCAGAGAGCACTCTCATCTCGTCTCATCCTCCGACTGAATAGCG
+AGCGGCTGCCTCCTTTATTCTTTTGAACTCTTCGCGGTTTTGGCACAAAC
+ATGCCAGAGACAGAGAGCGCTGTTACGCTCCCACCAGAGCAACTACGCTT
+AATTTTACTGAGGTGAAAGTTTTTTTTTTTTTTCTGGATAAAGCTTTGGA
+AAAGTTCTCAACTGTTGCTTCTTTAAAGATGCTGGGGCATATTCTGCCCT
+ATTTTCCAGTTTTTTACATCTCCCATAAATATTTTCACAAGCTGTAACAT
+TTTAGACAGGATTAAATTGAACTAGATAACTGACCAAAGGCTGCTAAATT
+ATTTTTATGTGCCTTGTAGCACAAATACTGTCTCACATATATTTTAAGTA
+TCTTAATATTCCCTCTGATGTTTAATTTAACAAAGCTGTCCTTCCCTCCA
+TCTCTCTCCTCATAGTTTTTCATTACAATTAGCTCTCATTAGATAGAATT
+GTATTTGTTGTCTTTGTGCCAGTCACTCCAGTCTATTTTGCCAGCACACA
+ACTAAATAATTGTTTTGCCTTGTCAGTGTCTTGTTTTACAGTTTTAATGA
+TGAGCCCAAAACATGTCAAATATGAGGAACTATAACTTATCAAGAAAGTG
+GGGTAGTTGAGATAAAACTGTTTCCGAGGTGGAGGTTGGCTGAGCTCCAT
+TTGGCCACAAAATGTAGCTGAAAGGGCAGAGAAACCCACTTTAATGGAGT
+ACAGGTTGCATATGAGCTGGTAGGAAAGATATAGAATCATTATCAGCTGA
+TAATCTAACAGTAGCAGTCAGTGTAGATGCTGTGCTAACGCAAAGTTGTG
+AAACTACTGTCTGTAAGCAACTCATCCAATTGTTATTGCTGCCAAGCTTA
+AGTATTTTAACAGCTTTTAGGTGTTGTTAGCACAGTACTCGTTTGGATCC
+GGCCATGACAAGAAATCTTTATCGGCCACTAATTTAATTAATCATCTTTT
+TTCAAGCAAAAATCACAAACTTTCTTTGGTTCCACTTTTTCTCATTGTAG
+ATTAAATATCTTTTGGGTTTTGGCACAGGCTGGACAAAAAAACCTCTGAG
+ACGCTGTGATAAGAATTTATTTTCACATTTTTTTTACTTTTCAGGGACTA
+CACAATTATTTGGTGATGAAAATAATATTTTGTTGCAGCCCAAATGTTAA
+CTTGCCACTCAAGCTGTCAATTCAAGAAGGCAAAAGCAACAAATACTGCT
+TTGCCGAGCTGAAATGAGAGTAGAAACCATGCCCGGGCCAGCTCAGCCTG
+GTCAGGTTTTTGAGTCCATCTATTGTTAACATTCAGGTTGCAGCACAAGG
+GAAGTTCCTAAATTCTTCTGGCATGTTAATGTTTTCCAAACTGATGTTAC
+CAAGTCCTCGTTATGATGAGAAAAAAATATGCTGAGAGTGAAATTGATCA
+AAGTGGAAACATTAAGCACTGCCACAGTCCCCTCCACCCATCTTTCTCCC
+TCTCTCTCCACCGCAACGTGGAAACTGCTCNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN
+CTCCCTCCCATTCTGTGCTCCGGTATANNNNNNNNNNNNNNNNNNNNNNN
+NNNNNNNNNNNNNCAGAGAGGGGTTCAGTCAGACAGATGTAACACAGCAG
+TAGAAGCCTGAGCTGAGCTGGCAGGCTGCGGAGGCCAGACCAGAGCCAGC
+AGCTCTGACTGGAGAGAACAGCGAAGAGGTGACGGCAGCAGCGGCAGCAC
+AGGGGATAAAACAGTAGTTGTAGTAGCAGTTTCAGTAGTTGTACTTCAGT
+TACAGAGCTGACTTTACCTCAGGATATGGGTGTGTTGATCTGGGCGCTCA
+TCACCCTGTGAATTTAACATGGACCCTGACACCAGCACCCATCCAGAGAC
+ACAACATGGTGAGTGAGATTTGAAGGAGGAAAAGATTAGAAACAATGAGA
+GTGATACTGTGGGAAAAGTTGAGGAGCGTGTTAGTGAACAAGGGAGTCAG
+GTCACATGGTTTTCCCGTTAGGGTTGCTATTATGACTAGGCTCTCCATTT
+GGCTCTAAAGCTGTTGACTAGGGCCTCTGTGGTCAAATGAATAGGACTTC
+AGTCTGTTCTGTTGAGTAGGGGGTGAAGGGGTGAGGGGTGTTACATGGCA
+ATGTGATGAAATCAACTGCCTGCTTAAGACATTTTGCTCTAATGACCCTC
+TTGTCATTACTTTAACAGGGTTGTAAAGTTTTTTTTGCTTTTTTGTAGCT
+AAGAAAGTTGAGAATTGTTTTGTCTGAACTCTCTCTGGGATTTGTCTTGT
+CGGTTTTTGGCTGGTTTTTGGTGTGAGCTTCACAGAGCAGGAAGCTCTCC
+TCCTGCTCTTTGAATGGAATAATTAACTGTGAGGGCCGTGGGTGTACCAT
+TTCTGCTCAAAAGCAGCAAGATAATTTGATGGTTATGTGAATCTGTATAT
+TTGTATGCTGTGTAGTGGTGCTGCATGTGGGTGTTTGTGTTAGAGACACA
+GAGGGGCACCAAAGAATGAAAGTGGGAGACAGAGGGAACGAGAAGGGGAG
+AGACCGAGAGAGAAGGACTTATGTACACAAATAAATCCAGGGGGATCTAG
+ACTGCACTGTAGGCCAGTGCGAATGCTCACTCTTTCTCTTCCCCCTCATT
+TTCCGCTGCCTCTTTTTTTTCCTCCACTGCTCCAAATGTTGGAGCCCAAA
+CTAGATAGTTAAAAGGCAGAAAAAAATGGTGTGTTATTAACTGGGCCAGA
+AAAGACGATGTTTTGTCTTCATGGCCGATGGGAAGGACTCTGCTGTGCTG
+CTGATGAAGAATGTGGTTAACAGAATGAGTCAACAGAGAACATATTTCCA
+AGAGACTGTAGTTTCTCTTCGCCAGCGTCTAAGCCACATTGCTTTATGCA
+CTGGGCTCTCTGCCATGACGGCGAAGGAGAGACAAAGAGAGGGGAAAGAG
+AATCGCTAAAGATAAAACTCTGTTTTTATCCATCTCCTGAGACACAAAAC
+TTCTGTTAGCAATCTAACCAAATAAGCGAGAACATTAAGCTTCTTCTCAC
+CTTCCCAAAATAAAATGTCAACTTCATGCAGTAATACTCACTCTCTTCTC
+TCAACCAGTCAGCCAGCCTCTTTCAGTGCATACAGCTTGAGGAGATCCCT
+TCTAAAGGTCCAATATAAATAGAAAAGTGGGAGTAGAAAGGGCAATAATC
+TGATATCATCTGATTACATTCACACCTCAGGCTTGCACGCTACAGGAAGA
+GTTCACGCTTCCCAAGGCTTGCAGGCATCACTTTTCACTCATTCTCAGAT
+AGACACACAAACACATGCACAGAAATATCATTGCTGTTGTTTGCAACAAA
+TCCTGGAGTAGACTACTTTGCATTGAATTTCTATATGCATGTGTTTTCAT
+ATATTACACATTGCTTTTTGTACTTTGCATATAAAGTAGATGCTGATCTG
+CTATCTGCATATATAGTAGCTGCAGATAGCACTGTAACTACATCTACATA
+TTTCTTGTTTGTATCTACATCAAGCAGATAGTTGCTGATGCTGGACAACC
+TCTTCCGATATTCATTATTTTGGAAAAAAAAATATCAATGGCATTCCTAC
+CTTACAACTTAAATTAAAAGTGGTCACTTGAGTAACTGCAGAACATGTGT
+TCACCCAATAGTTTTTTTTAGAGAGTGTCACTCAAAGTATTCCTCCTTAC
+AAGCACCCATGCCTAAATCA
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.poly
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.poly Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,2 @@
+18 0.0 0.0 0.0 scaffold_1 613 632 (13588) (GT)n Simple_repeat 1 20 (0)
+67 2.9 1.4 0.0 scaffold_1 11981 12050 (2170) (CT)n Simple_repeat 1 71 (0)
diff -r 5673e72241aa -r bdfc22c1c3e3 test-data/small.fasta.stats
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/small.fasta.stats Wed May 02 20:18:11 2018 -0400
@@ -0,0 +1,51 @@
+==================================================
+file name: dataset_12.dat
+sequences: 1
+total length: 14220 bp (14220 bp excl N/X-runs)
+GC level: 39.94 %
+bases masked: 378 bp ( 2.66 %)
+==================================================
+ number of length percentage
+ elements* occupied of sequence
+--------------------------------------------------
+SINEs: 0 0 bp 0.00 %
+ ALUs 0 0 bp 0.00 %
+ MIRs 0 0 bp 0.00 %
+
+LINEs: 0 0 bp 0.00 %
+ LINE1 0 0 bp 0.00 %
+ LINE2 0 0 bp 0.00 %
+ L3/CR1 0 0 bp 0.00 %
+
+LTR elements: 0 0 bp 0.00 %
+ ERVL 0 0 bp 0.00 %
+ ERVL-MaLRs 0 0 bp 0.00 %
+ ERV_classI 0 0 bp 0.00 %
+ ERV_classII 0 0 bp 0.00 %
+
+DNA elements: 0 0 bp 0.00 %
+ hAT-Charlie 0 0 bp 0.00 %
+ TcMar-Tigger 0 0 bp 0.00 %
+
+Unclassified: 0 0 bp 0.00 %
+
+Total interspersed repeats: 0 bp 0.00 %
+
+
+Small RNA: 0 0 bp 0.00 %
+
+Satellites: 0 0 bp 0.00 %
+Simple repeats: 8 378 bp 2.66 %
+Low complexity: 0 0 bp 0.00 %
+==================================================
+
+* most repeats fragmented by insertions or deletions
+ have been counted as one element
+
+
+The query species was assumed to be homo
+RepeatMasker Combined Database: Dfam_Consensus-20170127
+
+run with rmblastn version 2.2.27+
+The query was compared to unclassified sequences in ".../dataset_2.dat"
+