Mercurial > repos > iuc > vgp_split_agp
changeset 0:fc30c955f2ac draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/vgp_processcuration commit c25e877636f68656a0005883efb0f03b5ffd6b0c
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,58 @@
+<macros>
+    <!-- Package requirement pinned to the tool version token; the yield element lets the expanding tool append more requirements. -->
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">vgp-processcuration</requirement>
+            <yield/>
+        </requirements>
+    </xml>
+    <token name="@TOOL_VERSION@">1.0</token>
+    <token name="@PROFILE@">21.09</token>
+    <xml name="edam_ontology">
+        <edam_topics>
+            <edam_topic>topic_0622</edam_topic> <!-- Genomics -->
+            <edam_topic>topic_3797</edam_topic> <!-- Genome assembly -->
+        </edam_topics>
+    </xml>
+    <xml name="xrefs">
+        <xrefs>
+            <xref type="bio.tools">vgp-processcuration</xref>
+        </xrefs>
+    </xml>
+    <xml name="citations">
+        <citations>
+            <citation type="bibtex">
+@misc{vgl_curation,
+    author = {VGL-Hub},
+    title = {VGL Curation - ProcessCuration toolkit for genome assembly submission},
+    year = {2025},
+    url = {https://github.com/vgl-hub/vgl-curation},
+}
+            </citation>
+        </citations>
+    </xml>
+    <!-- Shared help text. Defined as a token (not an xml macro) because help bodies are CDATA text:
+         an expand element written inside CDATA is never expanded, whereas tokens are substituted in text. -->
+    <token name="@HELP_COMMON@"><![CDATA[
+**About ProcessCuration**
+
+ProcessCuration is a Python-based toolkit designed to process manually curated genome assemblies for submission.
+It reconciles AGP files (A Golden Path) created in PretextView with genome assembly FASTAs, preparing them for
+database submission through renaming, reorienting, and sorting operations.
+
+The toolkit is part of the VGP (Vertebrate Genomes Project) curation pipeline and works in conjunction with
+tools like gfastats and MashMap.
+
+**Input Naming Convention**
+
+Scaffolds must follow the naming pattern before curation:
+
+- Haplotype 1: H1.scaffold_X
+- Haplotype 2: H2.scaffold_X
+
+**More Information**
+
+- GitHub repository: https://github.com/vgl-hub/vgl-curation
+- VGP Genome Assembly Pipeline: https://vertebrategenomesproject.org/
+    ]]></token>
+</macros>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/split_agp.xml Wed Jan 07 12:48:27 2026 +0000
@@ -0,0 +1,102 @@
+<tool id="vgp_split_agp" name="VGP Split AGP" version="@TOOL_VERSION@+galaxy0" profile="@PROFILE@">
+    <description>Correct AGP files and split haplotypes</description>
+    <macros>
+        <import>macros.xml</import>
+    </macros>
+    <expand macro="xrefs"/>
+    <expand macro="requirements"/>
+    <!-- Results are written into the job working directory (-o './') and collected below via from_work_dir. -->
+    <command detect_errors="exit_code"><![CDATA[
+        split_agp
+            -f '$fasta'
+            -a '$agp'
+            -o './'
+    ]]></command>
+    <inputs>
+        <param name="fasta" type="data" format="fasta,fasta.gz" label="Assembly FASTA file"
+            help="Input assembly FASTA file containing both haplotypes." />
+        <param name="agp" type="data" format="tabular" label="Curated AGP file"
+            help="Input curated AGP file created in PretextView with haplotype markers (Hap_1/H1 and Hap_2/H2)." />
+    </inputs>
+    <outputs>
+        <data name="corrected_agp" format="tabular" from_work_dir="corrected.agp"
+            label="${tool.name} on ${on_string}: Corrected AGP"/>
+
+        <!-- Haplotype 1 outputs -->
+        <data name="hap1_agp" format="tabular" from_work_dir="Hap_1/hap1.agp" label="${tool.name} on ${on_string}: Hap1 AGP"/>
+        <data name="hap1_unlocs_no_hapdups" format="tabular" from_work_dir="Hap_1/hap.unlocs.no_hapdups.agp" label="${tool.name} on ${on_string}: Hap1 Unlocs without haplotigs AGP"/>
+        <data name="hap1_haplotigs" format="tabular" from_work_dir="Hap_1/haplotigs.agp" label="${tool.name} on ${on_string}: Hap1 Haplotigs AGP"/>
+
+        <!-- Haplotype 2 outputs -->
+        <data name="hap2_agp" format="tabular" from_work_dir="Hap_2/hap2.agp" label="${tool.name} on ${on_string}: Hap2 AGP"/>
+        <data name="hap2_unlocs_no_hapdups" format="tabular" from_work_dir="Hap_2/hap.unlocs.no_hapdups.agp" label="${tool.name} on ${on_string}: Hap2 Unlocs without haplotigs AGP"/>
+        <data name="hap2_haplotigs" format="tabular" from_work_dir="Hap_2/haplotigs.agp" label="${tool.name} on ${on_string}: Hap2 Haplotigs AGP"/>
+    </outputs>
+    <tests>
+        <test expect_num_outputs="7">
+            <param name="fasta" value="test_input.fasta.gz" ftype="fasta.gz"/>
+            <param name="agp" value="test_input.agp" ftype="tabular"/>
+            <output name="corrected_agp" file="expected_corrected.agp" ftype="tabular"/>
+            <output name="hap1_agp" file="expected_hap1.agp" ftype="tabular"/>
+            <output name="hap1_unlocs_no_hapdups" file="expected_hap1_unlocs_no_hapdups.agp" ftype="tabular"/>
+            <output name="hap1_haplotigs" file="expected_hap1_haplotigs.agp" ftype="tabular"/>
+            <output name="hap2_agp" file="expected_hap2.agp" ftype="tabular"/>
+            <output name="hap2_unlocs_no_hapdups" file="expected_hap2_unlocs_no_hapdups.agp" ftype="tabular"/>
+            <output name="hap2_haplotigs" file="expected_hap2_haplotigs.agp" ftype="tabular"/>
+        </test>
+    </tests>
+    <help><![CDATA[
+**What it does**
+
+split_agp corrects AGP files for sequence length discrepancies, splits haplotypes into separate files,
+assigns unlocalized sequences, and removes haplotig duplications.
+
+This tool performs three sequential operations:
+
+1. **AGPcorrect**: Validates sequence lengths from FASTA against AGP coordinates, adjusting start/end positions
+2. **hap_split**: Segregates lines containing haplotype markers into separate directories (Hap_1 and Hap_2)
+3. **unloc**: Processes metadata tags, renames unloc scaffolds with sequential numbering, removes haplotigs
+
+**Inputs**
+
+- **Assembly FASTA file**: FASTA file containing both haplotypes (may be gzip-compressed)
+- **Curated AGP file**: Tab-delimited AGP file with haplotype markers (Hap_1/H1 or Hap_2/H2)
+
+**Outputs**
+
+- **Corrected AGP**: Length-validated AGP file with corrected coordinates
+- **Hap1 AGP**: Haplotype 1 AGP file
+- **Hap1 Unlocs No Hapdups**: Haplotype 1 AGP with unlocalized sequences assigned and haplotigs removed
+- **Hap1 Haplotigs**: Removed duplicate haplotigs from Haplotype 1
+- **Hap2 AGP**: Haplotype 2 AGP file
+- **Hap2 Unlocs No Hapdups**: Haplotype 2 AGP with unlocalized sequences assigned and haplotigs removed
+- **Hap2 Haplotigs**: Removed duplicate haplotigs from Haplotype 2
+
+**Input Naming Requirements**
+
+⚠️ **Important**: Scaffolds in the input FASTA must follow this naming convention:
+
+- Haplotype 1: H1.scaffold_X
+- Haplotype 2: H2.scaffold_X
+
+This naming pattern is required before manual curation in PretextView.
+
+**Next Steps**
+
+After running split_agp, use the gfastats tool to sort each haplotype:
+
+1. Sort Haplotype 1: gfastats with Hap1 Unlocs No Hapdups AGP
+2. Sort Haplotype 2: gfastats with Hap2 Unlocs No Hapdups AGP
+
+Then proceed to the chromosome_assignment tool to assign chromosome-level names.
+
+.. class:: infomark
+
+**More Information**
+
+This tool is part of the VGP ProcessCuration pipeline for preparing curated genome assemblies for submission.
+
+@HELP_COMMON@
+    ]]></help>
+    <expand macro="citations"/>
+</tool>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_corrected.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,4 @@ +Scaffold_33 1 4414 1 W scaffold_16.hap1 1 4414 + Painted Hap_1 +Scaffold_34 1 4303 1 W scaffold_17.hap2 1 4303 + Painted Hap_2 +Scaffold_35 1 4409 1 W scaffold_17.hap1 1 4409 + Painted Hap_1 +Scaffold_36 1 4299 1 W scaffold_16.hap2 1 4299 + Painted Hap_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap1.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_33 1 4414 1 W scaffold_16.hap1 1 4414 + Painted Hap_1 +Scaffold_35 1 4409 1 W scaffold_17.hap1 1 4409 + Painted Hap_1
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap1_chr_level.fa Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,310 @@ +>SUPER_1 +CCCACACCCACCCCACCCCACCCCCACCCCCACCCCCCACACCCCACCCCACCCCACCCC +CACCCCTACCCCCCCACCCCCAACCCACCCCCACCCACCCACCCCTCACCCCACCCTACC +CCCAACCCCTCCCCCACCCCACCCAACCCACCCCTACCCTAACCCTAACCCTAACCCTAC +CCCTAACCTACCCTACCCTACCCTACCCACCCTAACCCTACCCTAACCCTAACCCTAACC +CCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACC +CTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTACCCAACCCTACCCTA +ACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTA +ACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTA +ACCCCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC +CTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCC +TAACCCTACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCC +CTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCC +TAACCCTAACCCTAAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC +CTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACC +CCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCCTAAC +CCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAA +CCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCCCCCCCCCTA +ACCCTACCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAA +CCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCC +CTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTACCCT +AACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCC +TAACCCTACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCCTAACCCACTCG +CCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTC +CTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATC +TAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAAC +CCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGT +TACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGG +ACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTA +ACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGG 
+GGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACT +TTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATG +GGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACC +GTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAA +AAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGC +ACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAAC +CACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAA +GGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGT +GCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTT +GCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACC +ACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGG +CACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATA +TGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGG +GTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCG +GCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAAC +CCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACA +GTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGAC +TGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGT +TGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAAC +CCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTA +ACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAA +CCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGG +GGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTT +TTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTAC +CATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTA +GACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCA +TATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCAC +AGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAAC +TTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCAC +CCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTG +ACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTG +CCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCA 
+CTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCC +CAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACA +TCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGG +GGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACA +CATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGA +CCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCT +AGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAAC +CCTACCCTAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCC +CTAACCCTAACCCTACCCCCCCCCACACCCCCCCAACGCCACCACTGACACTAACCCTCT +CCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTAC +CTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCA +AACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCT +TTGCCCAAGCGTAACCCTTACCTTTGCCTAGGTTTACTACCCACAAGGTTTACAATTTTC +ATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTT +TCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCC +ATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTT +CAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAAC +CTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAAT +CTAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAG +GGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCC +GAATCAGCCTTTTCACCCTTAATCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAAC +CCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTA +ACCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCTAAC +CCTAACCCTGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACT +TTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCAC +CCTTAATCTAACCCTAACCCTAACCCAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTT +CGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTA +ACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAA +CAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGG +ACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGG +GTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTA +ACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACAC 
+TAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCAT +AACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAG +GGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACAC +TTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTT +ACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCC +TAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTC +CATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATC +ACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAA +ACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTC +ACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCC +TGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTT +TGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAAC +CACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTG +CCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATA +CATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCT +GGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATA +CACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAG +GACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTT +CTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTA +ACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACC +CTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCC +CTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCG +GGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGG +GACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAA +CCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTA +CTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTA +CCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCT +ACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTAC +CTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAG +GGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTT +GTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCA +TAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACAT 
+CAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTT +TTGCTGACATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCCTAACCCAAAAACAGTA +CTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGG +TGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGG +ATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCT +AACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACC +CTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCC +TTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGG +TCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTG +GCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCAT +TTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGAC +ACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATAT +TCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGA +GCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGTAGACAAACTTTC +AACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTT +AATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACAC +TAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTA +AGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCG +GGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAG +CGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGG +AAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGA +CACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATA +CATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCAC +CACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCT +CCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTA +ACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACC +CCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGAC +TGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGA +CAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCG +GACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAA +CCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCC +ACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTT 
+TCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACAC +TTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTAC +TACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCT +CTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATA +TTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTT +TTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATA +GGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTG +ACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGAC +ACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACC +GTAACCCTTACCTTTGCCTAAGGTTACT +>SUPER_2 +AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT +TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTC +CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG +TCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA +TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTG +CTTTTCTCGCTCAAAAAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA +TTTTATTTGTCAAACTGTCATAGAATGACGCGCTAATTTCCACTTGAGTAAACATCAATT +CTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAA +AGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAA +ATGACAGAATATGAGTATTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGA +CATTTCCACTTGAGAAACATCAATTCTTTGCATGTTTTTGAAGGACAGCATGGTTTATTT +TGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGC +TCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTA +TTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATG +TTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGT +ACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGA +ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC +ACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG +TGTTGAGTTAGTGTGAAAAGTGAGGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAG +CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG +TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA +GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGACATGTTCA 
+TTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTA +TTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAA +ACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTT +AGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCC +GACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGT +CATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCAT +GGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGC +TTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGAT +TCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAAT +TCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAA +AAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAA +AATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAAT +GACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATT +TTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCG +CTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGT +ATTTATTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATG +TTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGT +ATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGA +ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC +ACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG +TGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAG +CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG +TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA +GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTC +ATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGT +ATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGA +AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT +TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTC +CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG +TCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA +TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTG +CTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA 
+TTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAA +TTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGA +AAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGA +AAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAA +TGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTAT +TTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTC +GCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTG +TATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCA +TGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCA +GTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACA +GAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTT +CCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATT +CGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAAT +AGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATT +TGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTG +AAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGT +TCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGA +GTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATCACATTTCCACTTGA +GAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGA +GTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTAT +TCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAAC +TGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAG +CATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTG +TGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTA +GATTCATTTGTATTTATTTGTCAAACTGTCATAGAATTATTCCGACCTGAAAATGACAGA +ATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCC +ACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCG +TGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAG +CGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTG +TCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAA +GGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTC +ATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGT 
+ATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGA +AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGT +TAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTC +CGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTG +TCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCA +TGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTG +CTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGA +TTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAA +TTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGA +AAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGA +AAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAA +TGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTAT +TTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTC +GCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTG +TATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCA +TGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCA +GTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACA +GAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTT +CCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATT +CGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAAT +AGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATT +TGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTG +AAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGT +TCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGA +GTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGA +GAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGA +GTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTAT +TCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAAC +TGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAG +CATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTG +TGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTA +GATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATC 
+AATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGT +GAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCT +GAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAG +AATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTT +ATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTC +TCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATT +TGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTG +CATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTG +CAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGA +CAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACAT +TTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAA +TTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAA +ATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTA +TTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTT +TGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACAT +GTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATAT +GAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTT +TAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTT +GAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTT +ATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAA +ACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGAC +AGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTT +TGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTT
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap1_inter_chr.tsv Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_33 SUPER_1 +Scaffold_35 SUPER_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap1_unlocs_no_hapdups.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_33 1 4414 1 W scaffold_16.hap1 1 4414 + Painted Hap_1 +Scaffold_35 1 4409 1 W scaffold_17.hap1 1 4409 + Painted Hap_1
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap2.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_34 1 4303 1 W scaffold_17.hap2 1 4303 + Painted Hap_2 +Scaffold_36 1 4299 1 W scaffold_16.hap2 1 4299 + Painted Hap_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap2_inter_chr.tsv Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_36 SUPER_1 +Scaffold_34 SUPER_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_hap2_unlocs_no_hapdups.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_34 1 4303 1 W scaffold_17.hap2 1 4303 + Painted Hap_2 +Scaffold_36 1 4299 1 W scaffold_16.hap2 1 4299 + Painted Hap_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_orientation.tsv Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,3 @@ + Hap_1 Hap_2 Main Orientation +0 SUPER_1 SUPER_2 - +1 SUPER_2 SUPER_1 -
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/expected_reversing_renaming.sak Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,4 @@ +RVCP SUPER_2_oldname +RVCP SUPER_1_oldname +RENAME SUPER_2_oldname SUPER_1 +RENAME SUPER_1_oldname SUPER_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test_hap1_sorted.fa Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,4 @@ +>Scaffold_33 +CCCACACCCACCCCACCCCACCCCCACCCCCACCCCCCACACCCCACCCCACCCCACCCCCACCCCTACCCCCCCACCCCCAACCCACCCCCACCCACCCACCCCTCACCCCACCCTACCCCCAACCCCTCCCCCACCCCACCCAACCCACCCCTACCCTAACCCTAACCCTAACCCTACCCCTAACCTACCCTACCCTACCCTACCCACCCTAACCCTACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCCTAACCCTAACCCTAACCCTACCCAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCCCCCCCCCTAACCCTACCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCCTAACCCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTACCCTAACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCTAACCCTAACCCCTAACCCTAACCCTAACCCTAACCCCTAACCCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATAC
ATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTA
TGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTACCCTAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCCCTAACCCTAACCCTACCCCCCCCCACACCCCCCCAACGCCACCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTAGGTTTACTACCCACAAGGTTTACAATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCACCCTTAATCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTACCCTACCCTAACCCTAACCCTAACCCTAACCCTAACCCTAACCCTGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTTGTCCCTTTTTGCCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCTAACCCAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACT
CAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTA
ACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACCCTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGCTTTACCATTTTCATACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGGCTATGGCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAATAAAAAGTTCGGCAACTTTTGCCGAATCAGCCTTTTCACCCTTAATCTAACCCTAACCCCTAACCCCTAACCCTAACCCTAACCCCCCCCCCTAACCCTAACCCTAACCCTAACCCCCTAACCCAAAAACAGTACTAAACTTAAAGAACTACAAACAAACTATGTATCCCTGGACTGGGTGGCGTAGGGACTGGTGTCCCCAACGCACTCGCCAGGAATACTGGGGCCGGGGGGACAGGCGGTATGCGGGTTGGATGGACCGTGCACCTTCCTTCCCTGCTTGGGGAGGGACTCGGACCCGATTCCCTAACCCTAACCCTAACCCTTAATCTAACCCTAACCCCCCTAACCCTAACCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCATAACCCTTACCTTTGCCTAAGGTTACTACCCACAAGGGTTACCATTTTCAGACATCGGAAGGGGGGTCCAAACCACTCGGGGGACCATGAAACGTGCTCCTACACACTTTCTGGGGGACACTTTTGGCCTTTGCCCAAGCGTAACCCTTACCTTTGCCTACCTTTACTACCCACAAGGTTTACCATTTTCATACATTCAAAGGGGGGTCCAAACGACTCAGGGGGCTCTGAAACGTGCTCCTAGACACTTTCTGGGGGACACTTTTGGGCTATGCCACTTTGTCATATTATCACACTTTTCCATATTCCCATACACATACATGGGAATATTAATATGGCCATAACTTTTGAACGGAACATCACAGAGCTTCAGGACCACCACCGTTGGACTCAGGGTACATCAAATAGGGGGGGTAGACAAACTTTCAACCTTCTAGCTCCAAAAAAAATCTTCAGCATTTTTGCTGACATCAGCCTTTTCACC
CTTAATCTACCCCCCCCGCACCCCCCCCAACGCCGCCACTGACACTAACCCTCTCCCTGACACTAACCCTGACCATAACCACTTACTACCCACTTGCCAAACCGTAACCCTTACCTTTGCCTAAGGTTACT +>Scaffold_35 +AACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAAAAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTTTATTTGTCAAACTGTCATAGAATGACGCGCTAATTTCCACTTGAGTAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAA
CATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATT
TTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATCACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGC
ATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGAGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTATATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTT
GTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTTAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGAGGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTTTAGATTCATTTGTATTTATTTGTCAAACTGTCATAGAATGACATTTCCACTTGAGAAACATCAATTCTTGCATGTTTTTGAAGGACAGCATGGTTTATTTTGAATTCGTGTTGAGTTAGTGTGAAAAGTGCAGTACATGTTCATTTTGTGCTTTTCTCGCTCAAATAGCGTTATTCCGACCTGAAAATGACAGAATATGAGTATTT \ No newline at end of file
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test_hap1_unlocs_no_hapdups.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,2 @@ +Scaffold_33 1 24739779 1 W scaffold_16.hap1 1 24739779 + Painted Hap_1 +Scaffold_35 1 24437540 1 W scaffold_17.hap1 1 24437540 + Painted Hap_1
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test_input.agp Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,7 @@ +##agp-version 2.1 +# DESCRIPTION: Generated by PretextViewAI Version 1.0.0 +# HiC MAP RESOLUTION: 39904.841797 bp/texel +Scaffold_33 1 24741001 1 W scaffold_16.hap1 1 24741001 + Painted Hap_1 +Scaffold_34 1 24461668 1 W scaffold_17.hap2 1 24461668 + Painted Hap_2 +Scaffold_35 1 24461668 1 W scaffold_17.hap1 1 24461668 + Painted Hap_1 +Scaffold_36 1 24581382 1 W scaffold_16.hap2 1 24581382 + Painted Hap_2
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test_mashmap.out Wed Jan 07 12:48:27 2026 +0000 @@ -0,0 +1,10 @@ +SUPER_1 24569333 0 24150000 - SUPER_2 24437540 419743 24421883 41 24150000 22 id:f:0.994373 kc:f:0.991464 +SUPER_1 24569333 24150000 24569333 - SUPER_2 24437540 12170 362135 5 419333 17 id:f:0.978691 kc:f:0.509185 +SUPER_2 24463642 0 10750000 - SUPER_1 24739779 13979195 24724929 41 10750000 22 id:f:0.994281 kc:f:0.996774 +SUPER_2 24463642 10750000 10800000 - SUPER_1 24739779 13806614 13856614 18 50000 15 id:f:0.967081 kc:f:0.518457 +SUPER_2 24463642 10800000 10850000 - SUPER_1 24739779 13929079 13979079 16 50000 14 id:f:0.962616 kc:f:0.645041 +SUPER_2 24463642 10850000 15200000 - SUPER_1 24739779 9359376 13681754 43 4350000 22 id:f:0.99353 kc:f:0.970742 +SUPER_2 24463642 15200000 19950000 - SUPER_1 24739779 4612591 9293719 37 4750000 23 id:f:0.99447 kc:f:0.999766 +SUPER_2 24463642 20000000 24250000 - SUPER_1 24739779 306879 4608250 44 4301371 23 id:f:0.995415 kc:f:0.990297 +SUPER_2 24463642 24250000 24300000 + SUPER_1 24739779 272287 322287 28 50000 18 id:f:0.982711 kc:f:0.859448 +SUPER_2 24463642 24300000 24463642 - SUPER_1 24739779 86973 246795 43 163642 25 id:f:0.996852 kc:f:0.926126
