changeset 0:fc30c955f2ac draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/vgp_processcuration commit c25e877636f68656a0005883efb0f03b5ffd6b0c
author iuc
date Wed, 07 Jan 2026 12:48:27 +0000
parents
children
files macros.xml split_agp.xml test-data/expected_corrected.agp test-data/expected_hap1.agp test-data/expected_hap1_chr_level.fa test-data/expected_hap1_haplotigs.agp test-data/expected_hap1_inter_chr.tsv test-data/expected_hap1_unlocs_no_hapdups.agp test-data/expected_hap2.agp test-data/expected_hap2_haplotigs.agp test-data/expected_hap2_inter_chr.tsv test-data/expected_hap2_unlocs_no_hapdups.agp test-data/expected_orientation.tsv test-data/expected_reversing_renaming.sak test-data/test_hap1_sorted.fa test-data/test_hap1_unlocs_no_hapdups.agp test-data/test_input.agp test-data/test_input.fasta.gz test-data/test_mashmap.out
diffstat 17 files changed, 512 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,56 @@
+<macros> <!-- Shared tokens and XML macros; imported by split_agp.xml through its <import> element -->
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">vgp-processcuration</requirement>
+            <yield/>
+        </requirements>
+    </xml> <!-- requirements: the package version follows the TOOL_VERSION token; the yield element lets a caller append further requirements -->
+    <token name="@TOOL_VERSION@">1.0</token> <!-- also used to build the tool version attribute in split_agp.xml -->
+    <token name="@PROFILE@">21.09</token> <!-- value of the tool's profile attribute in split_agp.xml -->
+    <xml name="edam_ontology">
+        <edam_topics>
+            <edam_topic>topic_0622</edam_topic> <!-- Genomics -->
+            <edam_topic>topic_3797</edam_topic> <!-- Genome assembly -->
+        </edam_topics>
+    </xml> <!-- edam_ontology: not expanded by split_agp.xml in this changeset -->
+    <xml name="xrefs">
+        <xrefs>
+            <xref type="bio.tools">vgp-processcuration</xref>
+        </xrefs>
+    </xml>
+    <xml name="citations">
+        <citations>
+            <citation type="bibtex">
+@misc{vgl_curation,
+    author = {VGL-Hub},
+    title = {VGL Curation - ProcessCuration toolkit for genome assembly submission},
+    year = {2025},
+    url = {https://github.com/vgl-hub/vgl-curation},
+}
+            </citation>
+        </citations>
+    </xml>
+    <xml name="help_common">
+        <![CDATA[
+**About ProcessCuration**
+
+ProcessCuration is a Python-based toolkit designed to process manually curated genome assemblies for submission.
+It reconciles AGP files (A Golden Path) created in PretextView with genome assembly FASTAs, preparing them for
+database submission through renaming, reorienting, and sorting operations.
+
+The toolkit is part of the VGP (Vertebrate Genomes Project) curation pipeline and works in conjunction with tools like gfastats and MashMap.
+
+**Input Naming Convention**
+
+Scaffolds must follow the naming pattern before curation:
+
+- Haplotype 1: H1.scaffold_X
+- Haplotype 2: H2.scaffold_X
+
+**More Information**
+
+- GitHub repository: https://github.com/vgl-hub/vgl-curation
+- VGP Genome Assembly Pipeline: https://vertebrategenomesproject.org/
+        ]]>
+    </xml> <!-- help_common: NOTE(review) an expand tag written inside a CDATA section is plain text and is never processed; confirm how this text is meant to reach a tool's help -->
+</macros>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/split_agp.xml	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,100 @@
+<tool id="vgp_split_agp" name="VGP Split AGP" version="@TOOL_VERSION@+galaxy0" profile="@PROFILE@">
+    <description>Correct AGP files and split haplotypes</description>
+    <macros>
+        <import>macros.xml</import> <!-- supplies the version/profile tokens and the xrefs, requirements and citations macros used below -->
+    </macros>
+    <expand macro="xrefs"/>
+    <expand macro="requirements"/>
+    <command detect_errors="exit_code"><![CDATA[
+        split_agp
+            -f '$fasta'
+            -a '$agp'
+            -o './'
+    ]]></command>
+    <inputs>
+        <param name="fasta" type="data" format="fasta,fasta.gz" label="Assembly FASTA file"
+            help="Input assembly FASTA file containing both haplotypes." />
+        <param name="agp" type="data" format="tabular" label="Curated AGP file"
+            help="Input curated AGP file created in PretextView with haplotype markers (Hap_1/H1 and Hap_2/H2)." />
+    </inputs>
+    <outputs> <!-- every output is collected by from_work_dir, relative to the './' directory passed to split_agp with -o -->
+        <data name="corrected_agp" format="tabular" from_work_dir="corrected.agp"
+            label="${tool.name} on ${on_string}: Corrected AGP"/>
+
+        <!-- Haplotype 1 outputs -->
+        <data name="hap1_agp" format="tabular" from_work_dir="Hap_1/hap1.agp" label="${tool.name} on ${on_string}: Hap1 AGP"/>
+        <data name="hap1_unlocs_no_hapdups" format="tabular" from_work_dir="Hap_1/hap.unlocs.no_hapdups.agp" label="${tool.name} on ${on_string}: Hap1 Unlocs without haplotigs AGP"/>
+        <data name="hap1_haplotigs" format="tabular" from_work_dir="Hap_1/haplotigs.agp" label="${tool.name} on ${on_string}: Hap1 Haplotigs AGP"/>
+
+        <!-- Haplotype 2 outputs -->
+        <data name="hap2_agp" format="tabular" from_work_dir="Hap_2/hap2.agp" label="${tool.name} on ${on_string}: Hap2 AGP"/>
+        <data name="hap2_unlocs_no_hapdups" format="tabular" from_work_dir="Hap_2/hap.unlocs.no_hapdups.agp" label="${tool.name} on ${on_string}: Hap2 Unlocs without haplotigs AGP"/>
+        <data name="hap2_haplotigs" format="tabular" from_work_dir="Hap_2/haplotigs.agp" label="${tool.name} on ${on_string}: Hap2 Haplotigs AGP"/>
+    </outputs>
+    <tests> <!-- one end-to-end test that compares all seven outputs against files in test-data/ -->
+        <test expect_num_outputs="7">
+            <param name="fasta" value="test_input.fasta.gz" ftype="fasta.gz"/>
+            <param name="agp" value="test_input.agp" ftype="tabular"/>
+            <output name="corrected_agp" file="expected_corrected.agp" ftype="tabular"/>
+            <output name="hap1_agp" file="expected_hap1.agp" ftype="tabular"/>
+            <output name="hap1_unlocs_no_hapdups" file="expected_hap1_unlocs_no_hapdups.agp" ftype="tabular"/>
+            <output name="hap1_haplotigs" file="expected_hap1_haplotigs.agp" ftype="tabular"/>
+            <output name="hap2_agp" file="expected_hap2.agp" ftype="tabular"/>
+            <output name="hap2_unlocs_no_hapdups" file="expected_hap2_unlocs_no_hapdups.agp" ftype="tabular"/>
+            <output name="hap2_haplotigs" file="expected_hap2_haplotigs.agp" ftype="tabular"/>
+        </test>
+    </tests>
+    <help><![CDATA[
+**What it does**
+
+split_agp corrects AGP files for sequence length discrepancies, splits haplotypes into separate files,
+assigns unlocalized sequences, and removes haplotig duplications.
+
+This tool performs three sequential operations:
+
+1. **AGPcorrect**: Validates sequence lengths from FASTA against AGP coordinates, adjusting start/end positions
+2. **hap_split**: Segregates lines containing haplotype markers into separate directories (Hap_1 and Hap_2)
+3. **unloc**: Processes metadata tags, renames unloc scaffolds with sequential numbering, removes haplotigs
+
+**Inputs**
+
+- **Assembly FASTA file**: FASTA file containing both haplotypes (may be gzip-compressed)
+- **Curated AGP file**: Tab-delimited AGP file with haplotype markers (Hap_1/H1 or Hap_2/H2)
+
+**Outputs**
+
+- **Corrected AGP**: Length-validated AGP file with corrected coordinates
+- **Hap1 AGP**: Haplotype 1 AGP file
+- **Hap1 Unlocs No Hapdups**: Haplotype 1 AGP with unlocalized sequences assigned and haplotigs removed
+- **Hap1 Haplotigs**: Removed duplicate haplotigs from Haplotype 1
+- **Hap2 AGP**: Haplotype 2 AGP file
+- **Hap2 Unlocs No Hapdups**: Haplotype 2 AGP with unlocalized sequences assigned and haplotigs removed
+- **Hap2 Haplotigs**: Removed duplicate haplotigs from Haplotype 2
+
+**Input Naming Requirements**
+
+⚠️ **Important**: Before manual curation in PretextView, scaffolds in the input FASTA must follow this naming convention:
+
+- Haplotype 1: H1.scaffold_X
+- Haplotype 2: H2.scaffold_X
+
+
+**Next Steps**
+
+After running split_agp, use the gfastats tool to sort each haplotype:
+
+1. Sort Haplotype 1: gfastats with Hap1 Unlocs No Hapdups AGP
+2. Sort Haplotype 2: gfastats with Hap2 Unlocs No Hapdups AGP
+
+Then proceed to the chromosome_assignment tool to assign chromosome-level names.
+
+.. class:: infomark
+
+**More Information**
+
+This tool is part of the VGP ProcessCuration pipeline for preparing curated genome assemblies for submission.
+
+- GitHub repository: https://github.com/vgl-hub/vgl-curation
+    ]]></help>
+    <expand macro="citations"/>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_corrected.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,4 @@
+Scaffold_33	1	4414	1	W	scaffold_16.hap1	1	4414	+	Painted	Hap_1	
+Scaffold_34	1	4303	1	W	scaffold_17.hap2	1	4303	+	Painted	Hap_2	
+Scaffold_35	1	4409	1	W	scaffold_17.hap1	1	4409	+	Painted	Hap_1	
+Scaffold_36	1	4299	1	W	scaffold_16.hap2	1	4299	+	Painted	Hap_2	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap1.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_33	1	4414	1	W	scaffold_16.hap1	1	4414	+	Painted	Hap_1	
+Scaffold_35	1	4409	1	W	scaffold_17.hap1	1	4409	+	Painted	Hap_1	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap1_chr_level.fa	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,310 @@
+>SUPER_1
+CCCACACCCACCCCACCCCACCCCCACCCCCACCCCCCACACCCCACCCCACCCCACCCC
+CACCCCTACCCCCCCACCCCCAACCCACCCCCACCCACCCACCCCTCACCCCACCCTACC
+CCCAACCCCTCCCCCACCCCACCCAACCCACCCCTACCCTAACCCTAACCCTAACCCTAC
+CCCTAACCTACCCTACCCTACCCTACCCACCCTAACCCTACCCTAACCCTAACCCTAACC
+CCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACC
+CTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTACCCAACCCTACCCTA
+ACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTA
+ACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTA
+ACCCCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC
+CTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCC
+TAACCCTACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCC
+CTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCC
+TAACCCTAACCCTAAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC
+CTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC
+CCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCCTAAC
+CCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAA
+CCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCCCCCCCCCTA
+ACCCTACCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAA
+CCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCC
+CTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTACCCT
+AACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCC
+TAACCCTACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCCTAACCCACTCG
+CCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTC
+CTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATC
+TAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAAC
+CCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGT
+TACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGG
+ACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTA
+ACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGG
+GGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACT
+TTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATG
+GGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACC
+GTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAA
+AAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGC
+ACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAAC
+CACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAA
+GGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGT
+GCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTT
+GCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACC
+ACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGG
+CACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATA
+TGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGG
+GTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCG
+GCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAAC
+CCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACA
+GTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGAC
+TGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGT
+TGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAAC
+CCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTA
+ACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAA
+CCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGG
+GGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTT
+TTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTAC
+CATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTA
+GACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCA
+TATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCAC
+AGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAAC
+TTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCAC
+CCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTG
+ACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTG
+CCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCA
+CTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCC
+CAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACA
+TCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGG
+GGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACA
+CATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGA
+CCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCT
+AGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAAC
+CCTACCCTAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCC
+CTAACCCTAACCCTACCCCCCCCCACACCCCCCCAACGCCACCACTGACACTAACCCTCT
+CCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTAC
+CTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCA
+AACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCT
+TTGCCCAAGCGTAACCCTTACCTTTGCCTAGGTTTACTACCCACAAGGTTTACAATTTTC
+ATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTT
+TCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCC
+ATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTT
+CAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAAC
+CTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAAT
+CTAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAG
+GGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCC
+GAATCAGCCTTTTCACCCTTAATCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAAC
+CCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTA
+ACCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCTAAC
+CCTAACCCTGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACT
+TTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCAC
+CCTTAATCTAACCCTAACCCTAACCCAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTT
+CGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTA
+ACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAA
+CAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGG
+ACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGG
+GTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTA
+ACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACAC
+TAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCAT
+AACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAG
+GGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACAC
+TTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTT
+ACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCC
+TAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTC
+CATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATC
+ACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAA
+ACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTC
+ACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCC
+TGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTT
+TGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAAC
+CACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTG
+CCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATA
+CATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCT
+GGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATA
+CACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAG
+GACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTT
+CTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTA
+ACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACC
+CTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCC
+CTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCG
+GGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGG
+GACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAA
+CCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTA
+CTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTA
+CCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCT
+ACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTAC
+CTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAG
+GGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTT
+GTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCA
+TAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACAT
+CAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTT
+TTGCTGACATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCCTAACCCAAAAACAGTA
+CTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGG
+TGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGG
+ATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCT
+AACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACC
+CTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCC
+TTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGG
+TCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTG
+GCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCAT
+TTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGAC
+ACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATAT
+TCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGA
+GCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGTAGACAAACTTTC
+AACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTT
+AATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACAC
+TAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTA
+AGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCG
+GGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAG
+CGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGG
+AAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGA
+CACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATA
+CATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCAC
+CACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCT
+CCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTA
+ACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACC
+CCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGAC
+TGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGA
+CAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCG
+GACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAA
+CCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCC
+ACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTT
+TCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACAC
+TTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTAC
+TACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCT
+CTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATA
+TTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTT
+TTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATA
+GGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTG
+ACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGAC
+ACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACC
+GTAACCCTTACCTTTGCCTAAGGTTACT
+>SUPER_2
+AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT
+TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTC
+CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG
+TCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA
+TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTG
+CTTTTCTCGCTCAAAAAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA
+TTTTATTTGTCAAACTGTCATAGAATGACGCGCTAATTTCCACTTGAGTAAACATCAATT
+CTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAA
+AGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAA
+ATGACAGAATATGAGTATTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGA
+CATTTCCACTTGAGAAACATCAATTCTTTGCATGTTTTTGAAGGACAGCATGGTTTATTT
+TGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGC
+TCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTA
+TTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATG
+TTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGT
+ACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGA
+ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC
+ACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG
+TGTTGAGTTAGTGTGAAAAGTGAGGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAG
+CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG
+TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA
+GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGACATGTTCA
+TTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTA
+TTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAA
+ACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTT
+AGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCC
+GACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGT
+CATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCAT
+GGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGC
+TTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGAT
+TCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAAT
+TCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAA
+AAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAA
+AATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAAT
+GACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATT
+TTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCG
+CTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGT
+ATTTATTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATG
+TTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGT
+ATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGA
+ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC
+ACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG
+TGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAG
+CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG
+TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA
+GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTC
+ATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGT
+ATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGA
+AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT
+TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTC
+CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG
+TCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA
+TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTG
+CTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA
+TTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAA
+TTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGA
+AAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGA
+AAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAA
+TGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTAT
+TTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTC
+GCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTG
+TATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCA
+TGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCA
+GTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACA
+GAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTT
+CCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATT
+CGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAAT
+AGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATT
+TGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTG
+AAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGT
+TCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGA
+GTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATCACATTTCCACTTGA
+GAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGA
+GTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTAT
+TCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAAC
+TGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAG
+CATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTG
+TGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTA
+GATTCATTTGTATTTATTTGTCAAACTGTCATAGAATTATTCCGACCTGAAAATGACAGA
+ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC
+ACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG
+TGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAG
+CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG
+TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA
+GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTC
+ATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGT
+ATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGA
+AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT
+TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTC
+CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG
+TCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA
+TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTG
+CTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA
+TTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAA
+TTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGA
+AAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGA
+AAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAA
+TGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTAT
+TTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTC
+GCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTG
+TATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCA
+TGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCA
+GTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACA
+GAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTT
+CCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATT
+CGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAAT
+AGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATT
+TGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTG
+AAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGT
+TCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGA
+GTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGA
+GAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGA
+GTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTAT
+TCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAAC
+TGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAG
+CATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTG
+TGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTA
+GATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATC
+AATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGT
+GAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCT
+GAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAG
+AATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTT
+ATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTC
+TCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATT
+TGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTG
+CATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTG
+CAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGA
+CAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACAT
+TTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAA
+TTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAA
+ATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTA
+TTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTT
+TGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACAT
+GTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATAT
+GAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTT
+TAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTT
+GAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTT
+ATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAA
+ACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGAC
+AGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTT
+TGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTT
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap1_inter_chr.tsv	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_33	SUPER_1
+Scaffold_35	SUPER_2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap1_unlocs_no_hapdups.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_33	1	4414	1	W	scaffold_16.hap1	1	4414	+	Painted	Hap_1	
+Scaffold_35	1	4409	1	W	scaffold_17.hap1	1	4409	+	Painted	Hap_1	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap2.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_34	1	4303	1	W	scaffold_17.hap2	1	4303	+	Painted	Hap_2	
+Scaffold_36	1	4299	1	W	scaffold_16.hap2	1	4299	+	Painted	Hap_2	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap2_inter_chr.tsv	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_36	SUPER_1
+Scaffold_34	SUPER_2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_hap2_unlocs_no_hapdups.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_34	1	4303	1	W	scaffold_17.hap2	1	4303	+	Painted	Hap_2	
+Scaffold_36	1	4299	1	W	scaffold_16.hap2	1	4299	+	Painted	Hap_2	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_orientation.tsv	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,3 @@
+	Hap_1	Hap_2	Main Orientation
+0	SUPER_1	SUPER_2	-
+1	SUPER_2	SUPER_1	-
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/expected_reversing_renaming.sak	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,4 @@
+RVCP	SUPER_2_oldname	
+RVCP	SUPER_1_oldname	
+RENAME	SUPER_2_oldname	SUPER_1
+RENAME	SUPER_1_oldname	SUPER_2
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_hap1_sorted.fa	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,4 @@
+>Scaffold_33
+CCCACACCCACCCCACCCCACCCCCACCCCCACCCCCCACACCCCACCCCACCCCACCCCCACCCCTACCCCCCCACCCCCAACCCACCCCCACCCACCCACCCCTCACCCCACCCTACCCCCAACCCCTCCCCCACCCCACCCAACCCACCCCTACCCTAACCCTAACCCTAACCCTACCCCTAACCTACCCTACCCTACCCTACCCACCCTAACCCTACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTACCCAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCCCCCCCCCTAACCCTACCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCCTAACCCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTT
TGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGG
TAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTACCCTAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCCCCCCCACACCCCCCCAACGCCACCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTAGGTTTACTACCCACAAGGTTTACAATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCACCCTTAATCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCCAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACAT
CACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGAC
CATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACT
+>Scaffold_35
+AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAAAAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTTTATTTGTCAAACTGTCATAGAATGACGCGCTAATTTCCACTTGAGTAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTAT
TTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATT
TTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATCACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTT
GTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCT
CGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTT
\ No newline at end of file
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_hap1_unlocs_no_hapdups.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,2 @@
+Scaffold_33	1	24739779	1	W	scaffold_16.hap1	1	24739779	+	Painted	Hap_1	
+Scaffold_35	1	24437540	1	W	scaffold_17.hap1	1	24437540	+	Painted	Hap_1	
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_input.agp	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,7 @@
+##agp-version	2.1
+# DESCRIPTION: Generated by PretextViewAI Version 1.0.0
+# HiC MAP RESOLUTION: 39904.841797 bp/texel
+Scaffold_33	1	24741001	1	W	scaffold_16.hap1	1	24741001	+	Painted	Hap_1	
+Scaffold_34	1	24461668	1	W	scaffold_17.hap2	1	24461668	+	Painted	Hap_2	
+Scaffold_35	1	24461668	1	W	scaffold_17.hap1	1	24461668	+	Painted	Hap_1	
+Scaffold_36	1	24581382	1	W	scaffold_16.hap2	1	24581382	+	Painted	Hap_2	
Binary file test-data/test_input.fasta.gz has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_mashmap.out	Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,10 @@
+SUPER_1	24569333	0	24150000	-	SUPER_2	24437540	419743	24421883	41	24150000	22	id:f:0.994373	kc:f:0.991464
+SUPER_1	24569333	24150000	24569333	-	SUPER_2	24437540	12170	362135	5	419333	17	id:f:0.978691	kc:f:0.509185
+SUPER_2	24463642	0	10750000	-	SUPER_1	24739779	13979195	24724929	41	10750000	22	id:f:0.994281	kc:f:0.996774
+SUPER_2	24463642	10750000	10800000	-	SUPER_1	24739779	13806614	13856614	18	50000	15	id:f:0.967081	kc:f:0.518457
+SUPER_2	24463642	10800000	10850000	-	SUPER_1	24739779	13929079	13979079	16	50000	14	id:f:0.962616	kc:f:0.645041
+SUPER_2	24463642	10850000	15200000	-	SUPER_1	24739779	9359376	13681754	43	4350000	22	id:f:0.99353	kc:f:0.970742
+SUPER_2	24463642	15200000	19950000	-	SUPER_1	24739779	4612591	9293719	37	4750000	23	id:f:0.99447	kc:f:0.999766
+SUPER_2	24463642	20000000	24250000	-	SUPER_1	24739779	306879	4608250	44	4301371	23	id:f:0.995415	kc:f:0.990297
+SUPER_2	24463642	24250000	24300000	+	SUPER_1	24739779	272287	322287	28	50000	18	id:f:0.982711	kc:f:0.859448
+SUPER_2	24463642	24300000	24463642	-	SUPER_1	24739779	86973	246795	43	163642	25	id:f:0.996852	kc:f:0.926126