Mercurial > repos > iuc > vsnp_build_tables
changeset 11:6b3b0f5858e6 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/vsnp commit c38fd63f7980c70390d104a73ba4c72b266444c3
author | iuc |
---|---|
date | Fri, 10 Jun 2022 06:11:08 +0000 |
parents | 152716f90b84 |
children | |
files | macros.xml test-data/add_zc_metrics.tabular test-data/add_zc_metrics1.tabular test-data/add_zc_metrics2.tabular test-data/add_zc_metrics3.tabular test-data/add_zc_metrics4.tabular test-data/add_zc_metrics5.tabular test-data/r1_seqkit_fx2tab1.tabular test-data/r1_seqkit_fx2tab2.tabular test-data/r1_seqkit_stats1.tabular test-data/r1_seqkit_stats2.tabular test-data/r2_seqkit_fx2tab2.tabular test-data/r2_seqkit_stats2.tabular test-data/samtools_idxstats.tabular test-data/samtools_idxstats1.tabular test-data/samtools_idxstats2.tabular test-data/samtools_idxstats3.tabular test-data/samtools_idxstats4.tabular test-data/samtools_idxstats5.tabular test-data/statistics_output1.tabular test-data/statistics_output2.tabular test-data/statistics_output3.tabular vsnp_add_zero_coverage.py vsnp_build_tables.py vsnp_build_tables.xml vsnp_get_snps.py vsnp_statistics.py |
diffstat | 27 files changed, 493 insertions(+), 294 deletions(-) [+] |
line wrap: on
line diff
--- a/macros.xml Mon Dec 06 18:28:04 2021 +0000 +++ b/macros.xml Fri Jun 10 06:11:08 2022 +0000 @@ -1,7 +1,6 @@ -<?xml version='1.0' encoding='UTF-8'?> <macros> - <token name="@TOOL_VERSION@">1.0</token> - <token name="@VERSION_SUFFIX@">2</token> + <token name="@TOOL_VERSION@">3.0.6</token> + <token name="@VERSION_SUFFIX@">0</token> <token name="@PROFILE@">21.01</token> <xml name="biopython_requirement"> <requirement type="package" version="1.79">biopython</requirement> @@ -13,7 +12,7 @@ <requirement type="package" version="3.0.9">openpyxl</requirement> </xml> <xml name="pandas_requirement"> - <requirement type="package" version="1.3.0">pandas</requirement> + <requirement type="package" version="1.4.2">pandas</requirement> </xml> <xml name="pysam_requirement"> <requirement type="package" version="0.15.4">pysam</requirement> @@ -24,6 +23,9 @@ <xml name="pyyaml_requirement"> <requirement type="package" version="5.4.1">pyyaml</requirement> </xml> + <xml name="seqkit_requirement"> + <requirement type="package" version="2.2.0">seqkit</requirement> + </xml> <xml name="xlrd_requirement"> <requirement type="package" version="2.0.1">xlrd</requirement> </xml>
--- a/test-data/add_zc_metrics.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -MarkDuplicates on data 4_ MarkDuplicates BAM output 10.338671 98.74% -VCFfilter_ on data 7 611
--- a/test-data/add_zc_metrics1.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -Mcap_Deer_DE_SRR650221_fastq_gz 0.439436 8.27% -Mcap_Deer_DE_SRR650221_fastq_gz 36
--- a/test-data/add_zc_metrics2.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -MarkDuplicates on data 4_ MarkDuplicates BAM output 10.338671 98.74% -VCFfilter_ on data 7 611
--- a/test-data/add_zc_metrics3.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -13-1941-6_S4_L001_R1_600000_fastq_gz 0.001252 0.13% -13-1941-6_S4_L001_R1_600000_fastq_gz 0
--- a/test-data/add_zc_metrics4.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -Mcap_Deer_DE_SRR650221_fastq_gz 0.439436 8.27% -Mcap_Deer_DE_SRR650221_fastq_gz 36
--- a/test-data/add_zc_metrics5.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,3 +0,0 @@ -# File Number of Good SNPs Average Coverage Genome Coverage -13-1941-6_S4_L001_600000_fastq 0.002146 0.16% -13-1941-6_S4_L001_600000_fastq 0
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r1_seqkit_fx2tab1.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,101 @@ +#id seq qual length avg.qual +XXXXXXXXXX:7:1101:1582:1835#/1 NGCTTCAGTTGGTACAGGTGTGTCACCCGTAGTTTGTAGGCTTGGAAGCCTGTAAGCTGTAGGGAACGTGGCAAGAACCAGATCTGGCCTTCCATATCTC BP\ccccc`eeccdeef_`fgabeghehdfhb^caefhee^efcehaeehhWabehddeM_eehhdeebd\^^a_]`___aaa`c]`Y^aaaaa_]]]aY 100 52.19 +XXXXXXXXXX:7:1101:1610:1859#/1 NTTATGTGTTACGTGAATCTCCTGAAGACAGCAGAAACTAGGTTGGTGAATTCTTATCCATTCTGCCATTCTGTATCTTTTAAGTGGAGCATTTAGGCTA BP\cceceggggggiihiiiiiiiiiiihihhiiihihiiiihiiihhiiihiiihhiiiihhiiiifhiiihgigggggggeeeeeecccddcdccbcc 100 52.73 +XXXXXXXXXX:7:1101:1743:1871#/1 NCGGGATGGAGGCAGGGCAAGCGGATGCAGGCCCAGCCCTGCCCTTACAGGTAGCTGGAAGTGACGAAGGAGTGGGGCCCCCGGACTCTGCTCAGGTGGA BP\ccceeggggghiiidfffhghfhhfffhhhidgggffbbghhheggeg`ccbccb_bdbdbbccaV^aaX^a`]X[_cca]]X]bc]Y]b`X`Y`_` 100 52.42 +XXXXXXXXXX:7:1101:1536:1878#/1 NGGCCTTTTTGGACAGGTGGTGTGTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGC BP\cccedggggbffhieghdbgdeghffffhih[aaefdhefhhihhiiidffdffhgbbagaeebbdcddb_bcccbR]YXT]_`ab``[^b^]bcbb 100 52.41 +XXXXXXXXXX:7:1101:2990:100153#/1 GCCAGGAGTGACTGTGTTGTTCTTTGCTTTATATACATAAGCGCATCTCTTGCCCAAATAGAATTCTGTTTCATCTCGGGCGTAAACACCTTCAATTTTA ___cccecaegceg[dgfhgfbgdfgfhhfhhdfedhffhhhhhh[fhbbd_S^aaegfg`dfhgghhbcgddd``geadcc_a_a_][_c]bccccbba 100 64.07 +XXXXXXXXXX:7:1101:1624:1906#/1 NCCAGGTTTAAGGCATTACATCGAGGGGCTGAACTTGAGACAGTCCCTGAAAATGTAAGAACAGGAGCTAGAACTTGCTTATGGGAAGGGCCTAGGGAGA BP\cceeegggggiiiiihiiiiiiiiiiiiiiiiihiihihhiiiiiiifhiihhihdbfhggggeeeeddbddbdccccccbcbccccccccccccc_ 100 52.70 +XXXXXXXXXX:7:1101:1666:1926#/1 NGCAAACTGGTCAGGACCTGGAGCTGCTTGCCTGGCCTTGGCACAAGAGGCCGACATATGCCCAGCCCCTAGGAGTGACAGATCCGTCCTCTGTGGGAAC BPaceeeegggggiiiiiiiiiiiiiiiiiiihihiiiiiihiiiiiiiiiiiiiiiggggggeeeeccccccbbcaccccccccccccccccccccabc 100 52.71 +XXXXXXXXXX:7:1101:2921:100163#/1 CTCCGGATGCCAAAGGATCTGACAGTGTATCTAGCTTTGGAAAACACAGGGGTCTGCCCTGTGAGCTGCTCCAACACCTTGGCTGCTCGCGTCAGTCTGT bbaeeeeegggggiiihihhhiiiigheegfhhgdhihhhhhihhfhhhhbgggghihhdggihggeggeeeeeeacccccbccccccccc_a__bbccc 100 67.82 +XXXXXXXXXX:7:1101:1513:1929#/1 NCACTATCAAGGTTAGTGTCTATATCTACTTGAGANAAAATACTGAAAATTCAGTGTATGAAGCCAAATCCTGATTTAACAAGTTATTGGTAGTATAAGT BPY`acccceeeY`bfefeggehe`gddgceh_eWBPYbedeehfdefhhh]fhehbffhh_eeehded`cfhhdheeeeeeeddccccac`b]]ZZa`T 100 49.64 +XXXXXXXXXX:7:1101:2759:100170#/1 CTGCTCATCACATTCCAGATGCCATCACAGGCAATGACCATGAATTCATGGTCGTCAGTGAGAGTCAGCACCTTGATGTCAGGAAGGGCTGAAATCATCT bbbeeeeegggggiiiiihiiiiiiiiiiiiiiiiiiiiiiiihiiihiiihiiiiiighhiiihiiiiiiigggggggeeeeeddcccccabccccccc 100 69.31 +XXXXXXXXXX:7:1101:1708:1937#/1 NGGTCGGTGTCCTTTTTTGGCGTCAAACTTATAGAGGGAAGCAGGGAATCTACCCAACCAAAGCCAATGAACAGTCAGTCAGTCCATCTAGTTAAGGTTC BP\accccecggghiihihifhihffhihf`fegfghf`\ebcefgiigdgeggdeeec`abcbcbbbcbccccc`bccbccb```bbcccccc`bb`bc 100 52.64 +XXXXXXXXXX:7:1101:2981:100211#/1 GGGGTCAGTGGGAAAGGTGTCAATGGGACTTCGGTCTCCATGCCGAAACACCAAAGTCACAAACTTCAACTCCTTGGCTAGTACACTTCGGTCTAGCCAG __beccceeeeggdhffghhhhiihhcghffhiefaghhhfffffffhhiigifhf\cdbdddeeeebcbbd_bb_^bcbaccbcbbbbaa^a_]b`b`a 100 66.08 +XXXXXXXXXX:7:1101:1688:1946#/1 NCCGCCTTCTTTCTCTACTTCGTGACCTTTTGTGGTCCCGAGACCTGCTGCATCTTCTGTCTGATGTTCGGCTTGAGTGTCTACTTCCTGAACGACTTCT BPYac``c[cccchdd]caddeddehhhhhd`cdb^b]cc[^c_^_acccddchdhdcd\bdd]bd^bbbU\^BBBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.51 +XXXXXXXXXX:7:1101:2767:100225#/1 CGCCTGGTGTCAATGCGCACATCTGGAGTTCCCATCTCCTTCATGGCAAATTTCCGAATCTCTTTGAGTGCCCGAGGTGCACGCTTCTTGAAGCCCACTC ___eceeefgggeiihihhhhihihihfgac_cefffihehiiiihhhhhfghhfhiehiihihf_ddbbgddcb`c]`bbbccccc`bb`b_bcccccc 100 66.85 +XXXXXXXXXX:7:1101:1536:1959#/1 NGATACTGTTGGGTCAGGACCAGGGCCTGCACCACCGAAATTCTGTCTTTTACAAACTGGACCAAGCGGTTGAGAATACAGGGGCCGAAGAGTAGGATTA BSYaa^ccggcg`d^dba_\ffh\[Zbf_aZ[c_cfY_ee`aeaf[\eefeghhffg_]\\`db^cdb`[ZWZR[`b]bbbbWELT]__TX^SYY]]]bb 100 50.36 +XXXXXXXXXX:7:1101:2797:100234#/1 GTGCTGGTCTCTCTCCACGATCTCTTACGTGCTAGCAGGGTGAACAAGGACGCCTCGCTGTCATTGCACTCACGCCACAGGAGCCTGGCACATTTCCGCT JY^accWceeeaWdcZ_feW`R^eg^a[HPP^_ef[d[Z_eUQX^ae_^Q\`ZSbUadVLKV_Z_Z_`]Z_baa^\WW^TGXTXWR^GW[][``BBBBBB 100 44.12 +XXXXXXXXXX:7:1101:1552:1976#/1 NTGATGAGTTTGCTAATACAATGCCAGTCAGGCCACCTACGGTGAAAAGAAAGATGAATCCTAGGGCTCAGAGCACTGCAGCAGATCATTTCATATTGCT BP\cceeeegegfiiiihiiiiiiiiiiihhiefgfhhhihifghdhhiiighfhhifihhiiiaghhigggggcdebdbddddcccccdedddddddcc 100 52.72 +XXXXXXXXXX:7:1101:1748:1978#/1 NCGCTGAGCAGGGCAGGCAGTGGTGGAGGCAGCCCCCCAAGACCCCATCTCTATCACAGTGAGAGCATCTGAACTCCAAAGCCACGACAGAACAGCTCCC BP\ceeeeggggghiiiihihiiegihhihiifiihhi`gfffggggeeeeeeddcdbd_bccbcccbccc`bbbbccccbccccccccaccbbb_`bcc 100 52.66 +XXXXXXXXXX:7:1101:2779:100239#/1 TGGGTGCTCTCCTTGGTCAGCTGCTGCTCGAACAGAGCACTTCTAGATACAGAGTTGGACCCAGACACAGCAGGGGTGGCCATGGCGGCTGGGAAAGACC ___^cc^ceggeeghddghafhXbegefbaYYbfhfgf_ae[egegc_cccaacaefg[bZbZ\\ZbZZ^gZZ^[]WW\_^bBBBBBBBBBBBBBBBBBB 100 40.42 +XXXXXXXXXX:7:1101:1593:1980#/1 NGGCACCAGAAGCATGAGCATAGGCAGAGCCATTTCCACCATGCTGACGGCAGGCAAGAAGAAGACAAAAATGAACCCCTTTCATGCTTGTTTAGAAATG BP\ceeeeggggfiiiiiiiihiihiiihfihhiiiifhhhiiiiihhiiiiiihhigggggeeeeeddcccccccccccccccdcccdccccccccccc 100 52.71 +XXXXXXXXXX:7:1101:2946:100242#/1 TGGGGATGTTGTTAAAAAAAATACAGGCTCCCCCACAACTGGGGTGCCTGGGGGGAACTTGGTCTGCTTCAGCCCAAGAGGAATCAAAAGATCAAAAGCA ___eecccgggggihhfhihfdfhhiihhiifiiddbcd`\eghL\^a^bdccccTTWRY`bRYYXSYb``bbca`acW^a`^bbccccc_bb`bbcbac 100 58.29 +XXXXXXXXXX:7:1101:1987:1781#/1 NTTAGCAGGTCCTCGTAGCGTTTCCGCAACTCTCGGAATCTGGAGTCTTCGGAGTGCAACTCTGAGGGTCCCGGGAAACTTGCGCGGCTCGCCTCGGCCA BP\cceeegggggiiiiihiiiihiiiiiiiiiiiiiiifiiiihhghiiihiggfgeeeeeebddcccccccccaccccccccccccccaacccXa^a[ 100 52.65 +XXXXXXXXXX:7:1101:3046:100006#/1 CTGTACAGCATGGATGTGGACAGGGAAAACAGCAAGTGCACACAGTGGGACAGGCCACAGGACAGGCTGGGAGTGAATAAAGAGTTCACACTGCTTCCCT bbbeeeeegggggiiihiiiiiiiiiiiiiiihiiieghiihhihffghiiiiiihiihhiiiggggeeec\bZ^bcbccc_]^]_b`bc`bbccbcccc 100 66.70 +XXXXXXXXXX:7:1101:1900:1788#/1 NCCCGCTGCCCACGCCACTGTCCCGGCGCTGCCCTGGGCGCGGAATGCGCGTTAGGCAATCCCCGGTCTGCGCGTCCCACACGCAGATGTGGCCTGCCAG BP\ceeeefggfgiiihiihiiiifhhiiihhiihiiihgeecccccccccaccccccccccccac_accca]aa[aacccccccccccdbccaccccb_ 100 52.64 +XXXXXXXXXX:7:1101:3214:100027#/1 GGCTGAGGTACTGAATGAGGAACAGCAGGAGGTAACGTCTGAGGGTGCGGCTGGGGAACGGTTTGCACAGGGGTGGCTGTAGGAGCAGGAGGTGAAACAC ___eecee^cegghhhhhhfhhfgfhhfhhhh^eggfcefhffhbU^eghhehgggTXZ\aTTX\RRYTT[GWROTWW[GG]YGXW[baOQEQW]b`]XW 100 49.49 +XXXXXXXXXX:7:1101:1848:1879#/1 NCTTCTTCTTCCTCATGTTTTTTGATCAACTGCTCCACTTCTTTTTGTTTGAGAACTCTGATTACTGTCTTTCCATTCTCTCTTGTTAGTGTTGCAATTT BP\cceeegggggiiiiiiiiiihhihhiehfhihhhiiihiiiihfghihdggfhhiiihihh_ddcggeefdb`beeeeeddcddbdbbcc`bbcccc 100 52.70 +XXXXXXXXXX:7:1101:3237:100032#/1 CTCCCGAAGTGCTGGAATTACAGGCATGAGCCCCCACGCCTGGCCTGATCAAGCTGTTTCTCTTGCTTGGAATGCCCTTTGCTGCCTGGCCAGCTCCTAG _b_eeeeegegggiiiiiihiiffegfhhihiiiiiighiffhiiiiiiiiihhiibdeggggeeeeeebcbdbcbcccccccccccccccccccccccb 100 67.87 +XXXXXXXXXX:7:1101:3027:100049#/1 CACAGAAACACGGGTTCATGATGGTGAATGATATAGCGGGTGACAGATGGCTACAAACCAGTCATAGGCCATCACACTCAGGAGCATGTCTCTCTTCCAT bbbeeeeegggggidghiihhihidgfhiihihfiiiiii_eghiiiihihhiiiggggeebdddcddddcccccbbcccccccccccbbdccccccbbc 100 67.75 +XXXXXXXXXX:7:1101:1756:1891#/1 NCGATGTTGAAGCCTGAGACTAGTTCGGACTCCCCTTCGGCAAGGTCGAAGGGGGTTCGGTTGGTCTCTGCTAGTGTGGAGATAAATCATATTATGGCCA BP\cceeegggggiiiiihiiiihiiiiiiiiiiiiiiiiiiiiigiiegghige]_ccaaccc_bbbbcccccc_bbcbcbccccdccccddddccccc 100 52.67 +XXXXXXXXXX:7:1101:3238:100065#/1 GGATGATAGAGTGTGGGAGAGAAAAGGGAGAGAGACTTTGGAGCTGAGTGGGGACCGCCGGGGAGGGGAGGCCTCAGAGTGGCTCAGCTGTAGATGCGGC bb_eeeeegggggdfgifhghhiiiiiihghhfgdhihiiifhhiiiigghiiiiigeecccc_accc_ccccbcbbbc_bccccbcbcc_bccdcbcca 100 67.15 +XXXXXXXXXX:7:1101:1915:1901#/1 NTAGAGGCTTACTAGAAGTGTGAAAACGTAGGCTTGGATTAAGGCGACAGCGATTTCTAGGATAGTCAGTAGAATTAGAATTGTGAAGATGATAAGTATA BPY`cceegfggfihgghhhegfghfgihdfhhhhhhfeffdgighiiiiifhiifdgdgecddc_cbbbdbbdcb__`bcc__`_`bbcbbccccac`c 100 52.64 +XXXXXXXXXX:7:1101:3198:100082#/1 CCCCCGCTCAACTACAAATGTCAATATTGAATGAAGCATTAAAAGACAAACATAAAGTAACTTCAGCTTTTATCTAGCAATGCAGAATGAATACTAAAAT b__eeeeeggggfiiiiiiieghhffhfhiiiiiifhiiiiiihgfhhiiiiiiiiigghhihiiiifegfggeeeeededcdcddcccccddcccbbcd 100 68.63 +XXXXXXXXXX:7:1101:1964:1931#/1 NGGGGTCTTAGCTTTGGTTCTCCTTGCAAAGTTATTTCTAGTTAATTCATTATGCAGAAGGTATAGGGGTTAGTCCTTGCTATATTATGCTTGGTTATAA BP\`Z`cdggggfhhhhghfghhhhhhhhhhffhhhhhhhhdggfhhhhhhhhghhhfgfceghfhhhhdgdgdggbggfgfebdeeeedcddbbccccc 100 52.70 +XXXXXXXXXX:7:1101:3088:100091#/1 TCCCACGTTTCCCACTTTAAAACAGAAGACTGCAGAGGATGTGGTAGAGACTGCAACTGCCAATGTAGCATCCGTTTTCCCAATTTCTCAGTAACAGGAT bbbeeeecgggggiiiiiiiiihffhihiiiiifgdghbghggighhhihhiiihiiiihiiiiihiiiiggggebcecdcbddcccdcdbccccccc`b 100 68.56 +XXXXXXXXXX:7:1101:1840:1948#/1 NCAGGGTGAGGGGCTTCGTCTGCTGGATGTACTTGTTGCCGAACTGAGTGACCCCCCGGGGCCAGCCGGTCTGCGAGCGATTGGGCGGTACCACAGACAT BP\ceecegggggiiihhhhiiiiiighhfhhiifhiiiiiiiiiiiihiiifhhgccccccacccccccccccccccccccccccccacaccccccccc 100 52.69 +XXXXXXXXXX:7:1101:3105:100094#/1 GGGAACTCCAGGGATGAACATGAGAAGGCCCTTCTGCTGTAGTACTAACTGCAATCAGTGTCTCGGGCTTCATGGGCTTGGCTTTACGTAACAAGCCAGG ^[[^ccccc^eccgf\R`bggfffbffhhfhbXc]Xcfcg]ece_cegfadafhgfheNWW\_]eZFZW`^HVZ]UZ`ZKZGT\b_b[KYXGY_XQWbW^ 100 50.33 +XXXXXXXXXX:7:1101:1958:1952#/1 NTCATGGTAGGGGTAAAAGGAGGGCAATTTCTAGATCAAATAATAAGAAGGTAATAGCTACTAAGAAGAATTTTATGGAGAAAGGGACGCGGGCGGGGGA BPY`cccc^aaecf`e[dbeeedaaeVefhhhdeXc_fehdb_eedhhhed\acbefdhdddee`bbeeeeeacca]_aa__]]_aaaaaa]aaa_]XaT 100 52.40 +XXXXXXXXXX:7:1101:3190:100106#/1 CACGGTTAGGGTACCGCGGCCGTTAAACATGTGTCACTGGGCAGGCGGTGCCTCTAATACTGGTGATGCTAGAGGTGATGTTTTTGGTAAACAGGCGGGG bbbeeceegggggiihhhihifhiihiiiiifgeghihhhhhfhgfecR]_bcccccdcccdc]b]bbccccbccc^`bc_bcccaccccccccacccac 100 64.50 +XXXXXXXXXX:7:1101:1993:1999#/1 GTTTAATTGTGGGAGGCTGAGAGCAGCATTTTTACCAAATTGGTGTAAAAATGAAACGGGGTCCAGACGTGTACACTGACAGTTACAGTAAATTTCAAAA bbbeeeeegecgfdhhiiihihiiiiiiiihiighihhfhihhcf_ehhhiiiiihihhggadgggeeeccddddbccccccccccccedccecccdccc 100 68.03 +XXXXXXXXXX:7:1101:3117:100110#/1 GTTTTATGTTGTTAATGTGGTGGGTGAGTGAGCCCCATTGTGTTGTGGTAAATATGTAGAGGGAGTATAGGGCTGTGACTAGTATGTTGAGTCCTGTAAG ___eeeeeggggfiiiigihghiibfcgefdgfhii`ghiefefhghhaedghdhibfghfhiff^`gbggeeeedbcbdbbbccdedcccbbbcbbbcb 100 67.19 +XXXXXXXXXX:7:1101:2159:1798#/1 NCTTCCAGTCCCCTCCTCGATTTCACACCGGGACACACACCTGGGTCAGGTGAGCATGACACACAGCCCCCAGGATGGGCACCCCACCCTGCAGAGCAGA BP\ceeeegggggiiiiiiiiiihiiiiiiiihhiiiifiiiiiifgiiiggggggeeeeeddccccaccccccccccccccccccccccccccbccccb 100 52.69 +XXXXXXXXXX:7:1101:3147:100111#/1 AGAAATTATTTTTAAATGTCAGAGAGAATGCTATTATTGGCCAACTTGAAATTTCCTAATTAGCTATCTGAGCTATTTAAGTCTGTACTTCAGTGTCTTC bbbeeeeegggggiiiiifiiiiiiiiiiiiihhiiiihhiiiiiiiiiiiiiiiihigiiiiiiiiiiiihihfcghhihbggggfgeeeeea_bdddd 100 69.60 +XXXXXXXXXX:7:1101:2152:1838#/1 NGGGAAACGCCATATCGGGGGCACCGATTATTAGGGGAACTAGTCAGTTGCCAAAGCCTCCGATTATGATGGGTATTACTATGAAGAAGATTATTACAAA BP\cceeegggggiiiiiiiiiiiiighigggggeeecccdccccdcceccccccccccccccccccccdccc^bbccccddccdcccccbcccddcccc 100 52.66 +XXXXXXXXXX:7:1101:3065:100152#/1 CACATAGTCAGCCTGCTTGATCACGTCGATCTTGTCCAGGAAGTACTGGGCACAGTCAATCAGCTGGTACTCGTTGGAGCGTTCGTAGCAGGCACGCACT ___ecacccggcgfhhhhhhh_gfdeghhhhhhhfhhdcdhXfX^f_eghhfUegbfh_be__dhbb`g`bga_aZ^]bdaX\^a^`aa`_[_aW]][]a 100 62.63 +XXXXXXXXXX:7:1101:2180:1843#/1 NTAGGGTGTAGCCTGAGAATAGGGGAAATCAGTGAATGAAGCCTCCTATGATGGCAAATACAGCTCCTATTGATAGGACATAGTGGAAGTGGGCTACAAC BP\cceecgggfehiehihhihhhhdffhihifdhhifghhhiiihihihiiihiiiiihiiihfhiffefgfdegeecac`d]bddbb_bcaacccccc 100 52.70 +XXXXXXXXXX:7:1101:3154:100159#/1 GTTTCATCATGTTGGCCAGGATGGTCTCAATCTCTTGACCTCGTGATCAGCCTGCCTTGGCCTCCCAAAGTACTGGGATTATAGGCGTGAGCCACCGCGT bbbeeeeegggggiiiiiiigiiiggiiiiififhiggiiiiifhiiiighiiiiiiiiihiiiiihhffffgggdgeeeeeedbdcaccaccccccaca 100 68.83 +XXXXXXXXXX:7:1101:2125:1861#/1 NGTGGGAGCAGCTGGCTGTGTGGCACCTGCTGTGGTGGCTGCTGGCGTGGCCGGAGTGAAGGGCAACGTGGCAGGTGCCGGGGGCTGGGCTGGATTCCCT BS\cceeegggggiiiiighghihfhifhhihfgfeghfbffgffaf_efffegX]Z]]_bccPZ^`aX`a]`acBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.83 +XXXXXXXXXX:7:1101:3198:100173#/1 TGGCAGGTGGTGGTGGTGCTCAAAGAGCAGGTCCAGGTGGAAAGTGAGCACCGACAATGGCTGCAGCAGGAGCAGCAGCTCTGTGGACAGGGAGGGACAA ___cccccece`gbZaffgadfgg_ddffghbafffdaffffhhedghhhhhffhgggadc_`bbbba^a\\XXT^[^[Y_]`Y]b]`b__aaBBBBBBB 100 44.48 +XXXXXXXXXX:7:1101:2076:1911#/1 NGGAGTAGGAGTACCCAGTCTCTAGTGCCAGCTGCAAGCGTTAATTTGGTTAAAGTCTCCTTGATTGTCCTGTTCATTCTTTCTACCTGACCTGAACTCT BS\ceeeegggggiihiiiiihiihgiiihiiiiiiiihhhihghiiiihhiiiihihiihiihiiihhiiihfggggggeeeeabcdbdddcccccccc 100 52.81 +XXXXXXXXXX:7:1101:3166:100190#/1 CCGGCCGAAATTGTTTTTTAAATTTACGTGTCACCCTTCATGCAGGGCCCTGCTACTCTTCGTAGCCCTCCTCCATGTTTAGTGTGGGTGCGGCTGCAGC bbbeeeeeffgegdgigfiihhiiihiifggghffc`gfffgheifffagdbddgdbeced`bdcaccbaccccb`b`bccbY`bccaX]_accaa^R^b 100 63.87 +XXXXXXXXXX:7:1101:2196:1920#/1 NTGGGGTGGGTATGGCGGGGCCAGCCTTGCTCAGTGCTGTGGTGATGGCCACAGTAGCCTCGGGGGGCACAGCCACGGCTGGGGGAGCAGGCCCTTCCTT BP\ccc`ceeceehhhhhhh[aZZZ^U]LZ]]ZTZ_]]TTY_KTT]]`[a]_[[R]]R__aR[aaaaTEW^XP[GRLTTOOXaaBBBBBBBBBBBBBBBB 100 40.29 +XXXXXXXXXX:7:1101:3225:100207#/1 GCTATTTTCTGCTAGGGGGTGGAAGCGGATGAGTAAGAAGATTCCTGCTACAACTATAGTGCTTGAGTGGAGTAGGGCTGAGACTGGGGTGGGGCCTTCT bbbeeeeeggfgghiiihiYcghiihiihiififhfghfhhhhhhggggggeeeeeddddddcdcac]`ababbbbacccccccbcccc[aaacaccccc 100 66.30 +XXXXXXXXXX:7:1101:2115:1927#/1 NCTCCTTCTTGGCCTGGAGGCGCTCTTCACGGCGCTTGCGTGCTTCCTTGGTCTTAGACCTGCGGGCCTCAGCCTGGTCAGCCAGGAGCTTCTTGCGGGC BS\ccecegeeggiiiffggfhhiiiihhdhihfdghddfggeeeeecdddZ]bcdcbcccbccacaaccccccc^`YYYX`bW`_`a[`_b``_baccT 100 52.51 +XXXXXXXXXX:7:1101:3019:100219#/1 GGCGGGTTTTAGGGGCTCTTTGGTGAAGAGTTTTATGGCGTCAGCGAAGGGTTGTAGTAGCCCGTAGGGGCCTACAACGTTGGGGCCTTTGCGTAGTTGT _[^ccc_cggccgghdgcbgdf_WcXae[cbefffgbefh_d`dgddb]aaZTZW__cc`bb]ZZ_^aaZ]a^`b_Y__ab[`_XT_^bbbbaBBBBBBB 100 44.46 +XXXXXXXXXX:7:1101:2179:1937#/1 NAGGAATACATATAGTCATCATTGCCAGACTTAATATGAGAGGTGAAATGTTCGATCCAATTTTCCTTCCTGGATAAGTTTTTCTTTCCTATCCCTCTCA BP\cceeeggggghigfghiiiiiiihiiiiiiiiiiifhhhheghhiihhhihiiiiiiiiifhghhiiiiihhgffdgfgegeeeeeeeddcddcccb 100 52.73 +XXXXXXXXXX:7:1101:3202:100230#/1 CTGAAAAACAAAACAAAACTTAGCTAAGTTTTATGGCAAGTGGGGGCAGGGTCAGGTGAAGAGGTAGGAATTGCCTGAGGTTGGGGGTCCCTAAAACATA __aeeeeegggggihhhiiiiihihhhhfghhhihhhiihfffgdfhhihiddggeceeeeedcbbdcbbbcbcc]bbcc^abccccT[acbbcccb^`b 100 65.28 +XXXXXXXXXX:7:1101:2149:1945#/1 NGTGTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGCCTAGTATGAGGAGCGTTATG BPYaccccegggghhhceghghhhhhhhhhfhhhhhhhhhhhhhffhghhhdffghghhbfghgfddgddcdddbebcbbbbbbbdcdbbbbaaaaaaab 100 52.67 +XXXXXXXXXX:7:1101:3211:100242#/1 CTGTTCCCCAATACCTGCAATTCACAGATATAATTTAGCATTTTTGTTTTTATATACTAATTTAGGCAAAACCCCCCCGCCACTGAATCGTCCAACAAAA ___`acacgggcghfdddc_gbggghddgfgfhhccdab[e[_Xbe^^cacdfgbaa[caSWWbfbf`efc_Zbg[XZaccaacccbcc[[WW^bbW[[a 100 61.18 +XXXXXXXXXX:7:1101:2169:1964#/1 NGGGAGCAAAAAGCGTGGGTACAGAAGCGAGAAGCGAGCTGAGTGGTTAGTTCAAATCAAGGCTTGGGGTATTTCCTGGTCATTTGGGGAACCTGAAACT BP\ccceeggggfehfhhh_fhifbgf[effhh`cfV__`gefccg`ddg`d`beeeadddbcccaaacNWY_bZ]`bb_YY__aGSTXGTW^R^R_b_` 100 50.12 +XXXXXXXXXX:7:1101:3168:100244#/1 CCCTTCCTGTGTCCATGTGATCTCATTGTTCAATTCCCACCTATGAGTGAGAATATGCGGTGTTTGGTTTTTTGTCCTTGCGATAGTTTACTGAGAATGA ___eeeeegegeghiihfbgghhhhfhaggiiiidbfhfhfbdegdfcffgdgfhhfhhfceefghicfffeeceddbddba^acc_bccccc[bbbcc_ 100 66.77 +XXXXXXXXXX:7:1101:3005:100246#/1 CAAAAGTTAAATGAAAAACCACAAGTTTAGTTTGACTCCGTCTCCTAGGGTGGATTTCATTCAGATATTTGTTCCATATTATAGGAGGGTGGATCCTAGC bbbeeeeegggggihhhihihiiiiiiiiihhihhhihiighiiiiihii^efaegfffhhfhhhiihhiidgggggdeeeeeeedccaZ\_accccccc 100 67.69 +XXXXXXXXXX:7:1101:2313:1789#/1 NTGCGCCTGGAAGCCGCCAGGCCGCAGCGCGGGGAACAGGGCGGCCACCCGGCTCAGCAGCCGCTCGCAGGGTCCCGGACCCGCCGCAGCCTCGGCTTCC BP\cceeegggggiihiiiiiihiihiiifhheccccccaccccccaccccccccccbcccccc_a]Zaaccbb`aaacaccaccccaaacccX]^^abc 100 52.58 +XXXXXXXXXX:7:1101:3253:100014#/1 GCGGATGATTCAGCCATAATTTACGTCTCGAGTGATGTGGGCGATTGATGAAAAGGCGGTTGAGGCGTCTGGTGAGTAGTGCATGGCTAGGAATAGTCCT bbbeceeegggggiiihihiiiiiiigfhiafbeccb_fdgaffhhhhhihihihhiieT]abcccccccccbb_WY]_bbbbccccccccbcbb`Y`bb 100 64.18 +XXXXXXXXXX:7:1101:2361:1794#/1 NGTTAGGCTCTCCACGACTGAGCTGGTCTCGGCACCAAGGGGGTCAGATTGCTTAAAGGCAAGGAGTTCAGGACCAGCCTGGGCAATGTGGGGAGACCTC BPYacceeegggfhhhhfhhfhhb_eaefdgghhfgfffgbfcfdeggfgeeeeeddbd\``aaabbbbdbbbb^[[^aba_aababb`_Y[aaaR[a`b 100 52.45 +XXXXXXXXXX:7:1101:2337:1794#/1 NGGGAAGGTGTCTGTCATCGTCCCCAGGAGGGAGGTGGCGTTAGCTGTTTGTCCTGTCATTAGGTTGGTAACTCTCCAAGTAACATTGAAGATCTGGTGA BP\c`ceceggggiihiiihiffffghi`ghhggi^ce`f_faghihbghigegdgR_ceeeeeU]`c^`_bcbbccbbb]`bcbcb`b`cbbbc_bbcc 100 52.47 +XXXXXXXXXX:7:1101:3284:100039#/1 TTGGGCGACAAGGACATGGAGCTGGAGGAGAGCGTGGAGGAGCGGCTGTTGAGTTCAGAGCCCGAGTCCACTGCCACCGAGGCCGGGCTGGCGGCCAGGG bbbeeeeegggggiihiiiiiiiiihhihiffhifhiihhifhigeec`db`bbccdcccbcccccacccccccc`bcc_acacccccccca_a[_BBBB 100 46.93 +XXXXXXXXXX:7:1101:2477:1795#/1 NGGCGGTGCACCGAGCTGGAGGCTGCCGCAGAGGAGGCGGCCGCCGCTGCGGCCATGTACGTGTAGGGGTAAGGGAACAGGCTTCCGAAAGGGGACATGG BP\ccccefeeggffghffhhihhhhhfifhhiidghfddcca_aWaWac_accabccdcaX`R^bba_X_bcccW`^acc_^[X`_[[[a_acacc]][ 100 52.30 +XXXXXXXXXX:7:1101:3310:100056#/1 GGGCGATTGATGAAAAGGCGGTTGAGGCGTCTGGTGAGTAGTGCATGGCTAGGAATAGTCCTGTGGTGATTTGGAGGATCAGGCAGGCGCCAAGGAGTGA bbbeeeeegffgfiihiihiighiiihiihhiii\edgfhiddggeggeeeedbddcdbdcccbbc^a`bcdccb`aabbaccb^acccacccca`cX`b 100 65.89 +XXXXXXXXXX:7:1101:2355:1821#/1 NTGTATTGAAGCCAAATTTCGTGCCAGGGTGGTGTTAGAATGTGAGCTATTTTCATTATATTTGGACTAGAATTTTTTCTTTTAGGAGAATGGTGGGGAA BS\cceeegggggiiiiiiihfgiihhii^egbffhfhfhhiehhhiihiiiiifgh`ffghiiighfhhgggfgggcdddddcbbbc`abcc_bcccac 100 52.78 +XXXXXXXXXX:7:1101:3420:100060#/1 GTGAAAAATGTTTAATTTACTTCAAAAATATCTTGCATAAGTATCTCATCCCTAAGCTCAAACAAACAAGAAAATTAAAGGCGGAAAGAATACATAAAAT ab_eeeeeggffgihhhihgfdhhhhihf]ghiihefhhig^fgbghbfdhhiihbffhhiihiiihhhhhcfhigfhdg`dFXZaccbcbcccddcbcc 100 56.56 +XXXXXXXXXX:7:1101:2418:1834#/1 NCGGTTTCAGTCGTCACTGCTGCCCCAGCCTTTCGCTGTCCTTCTTGCAAAAAGCTGCTCCCATCGGTATACCAGGTGTGGTCGGCGTCTGGGATGGGCT BPYcaceeggggfiiiiiiiihifiiihiiiiihdfhhfhfhiiiiihiihhhhhihihhiiegggeeecbeddcabbbcccccccc[aaccc`bccacc 100 52.67 +XXXXXXXXXX:7:1101:3267:100061#/1 CTGGGTAGTTCTGGCTCCGGGTCTCTCATGAGGTTGCAGTCACGATATTGGTTGGAGTTGCAGCCATCAGAAGGCTAGACTGCGTGTGAAAGACTCACTT _bbeeccegggggiiiiiihigghihifhiiiiffhiiihhihidghiihheghhhighgggfeeeeeeccddcccccccccccaacccdcccccccccc 100 68.01 +XXXXXXXXXX:7:1101:2378:1838#/1 NGCCCAACCAACAGCTTCAACAGCTATTGCAAGGTGCGCCAAAGGCATCTTGTCATCCCTCACACGAATCTCACTTCCTGTGAATTTGCAGGGAGGCAGA BP\ceeeegggggiiiihiiiiiiiiiiiiiiihfhiihiiiiiiiiiiiiiiiiiiiiiiggggeeebcddccccccccccddddcccdcccccccccc 100 52.71 +XXXXXXXXXX:7:1101:3416:100083#/1 GCCCAGTCCTGGGGGCAGGGGAGAAAGGGAGGGGTGAAATGAGAAGAGCCCCGTTCTTCCTCAGTGCTGGGGGGTTGGAGACACCACCCCCTTCTGCTGC ab_eeeeeggggfiiiiiiiighghhiiihhhiiL\bgeeeeeeddbddcccc^acacccccccbccccccccc]X_abcbcccaccacccccccccccc 100 61.17 +XXXXXXXXXX:7:1101:2481:1853#/1 NGCAGGTAGAGGCTTACTAGAAGTGTGAAAACGTAGGCTTGGATTAAGGCGACAGCGATTTCTAGGATAGTCAGTAGAATTAGAATTGTGAAGATGATAA BS\cceccgggggiiiiiiihiihhfhhihiiifhgiiiiiihiiiiiiiiiiiiiieggeeeeeebdddbddccbbccccccbbbccbcbcccccccdb 100 52.78 +XXXXXXXXXX:7:1101:3411:100111#/1 GTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGCCTAGTATGAGGAGCGTTATGGAG babeeeeegggggghiihiiiiiiiihdfgiiiiiifiiiiiiihiiiiefhhiiiegfhggghgggfbddeceeedbdbb_bedcccccccccccccba 100 68.20 +XXXXXXXXXX:7:1101:3258:100128#/1 GCTGTGGCTTTTTTAAGGATAACTACCTTGGGGGCCTTTTCATTGTTTTCCAACTCCGGGATCTGGTCACGCAGGGCAAAAAAGCTCCGTTTTAGCTCGT _b_ecceeggggfihghifffhhfghidghhiihighiihighiighhiifdffggggeecccccbccbccccca[_aaccccccbbbcacbcbbcccc[ 100 66.63 +XXXXXXXXXX:7:1101:2252:1856#/1 NCAGAAATATGGCAGTGCCACAGAGAGTGTGTCCTCATTGGAGTACTTGCGCTTAAATTCATCCAACACAAAGGTACTCTTGGGCAGGTGAGCGAAGGGG BPYcaccce^ecc^e`begg_a_fXQ`[Q_eb_b`d]ee^[ac^e^e[cbe^edeedVWW_bb\_\dd`bdGV^aaab``UUG\\\]_T_]aaaZO[T]a 100 50.04 +XXXXXXXXXX:7:1101:3428:100129#/1 GTTGGAGTGTAGGATAAATCATGCTAAGGCGAGGATGAAACCGATATCGCCGATACGGTTGTATAGGATTGCTTGAATGGCTGCTGTGTTGGCATCTGCT ___eeac\cecggfhhihihfhhiiiihiiihfhffihhhhihhidg`fgfgeeccccZ^^\]bbbc_bb`bbccabcbb`ba[]`YbS]Q[RSRX`bb_ 100 60.12 +XXXXXXXXXX:7:1101:2394:1871#/1 NTTTATTTCTAGGCCTACTCAGGTAAAAAATCAGTGCGAGCTTAGCGCTGTGATGAGTGTGCCTGCAAAGATGGTAGAGTAGATGACGGGTTGGGCCAGG BP\ceeeegggggiiiiiiiiiigghiiiiiiiigihihhiiiiiiiihighiiiiihgeggggeeeeedddddb_bccbcccdcccccc_ccccccccc 100 52.70 +XXXXXXXXXX:7:1101:3387:100138#/1 TTGAGGGAGGGCAGACACAGGCTGAGGAGAGTGGATAGGAGCAGGAGAACCTGCCACACCCCACACCCCACTGAGAGCTCATCAGCTGCAGCCCTGGGCC bbbeeeeegggggiiiiiiiiPdgfhihhfgXafffhfhhhiiiicfgifhhhegegceeccccccccc_aacc``__cccccbbcccc`bcccc`accc 100 63.66 +XXXXXXXXXX:7:1101:2269:1904#/1 NGCACCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCACTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCCAGGGTCAGGCCATTGCACTCC BPY`cceceaga^dadghhhgfhhbfghhhhhhhhfhgad`ec[ecedbbbecbdghgaaXKU^GZ\GTX`bRY]__bbT^aaRRWbb^a^]bbbbbb^` 100 49.98 +XXXXXXXXXX:7:1101:3444:100163#/1 TGTGGCTGTTCTATGAACCACCTTCTTCTTTCTGCGAGCAGTTCCTTTCCCACCAATGCGCACTTGTGCCTGCAGTTTGGCGAGGTTTTCCTGGGTCATG __\c\cc`^`c^be``bad`ddegaX`dgegfaIXW^^OW^O^ce]a^ae^egffgd_VZ_FT\ZV_]c`bb_bX]Z]R^baQREHW`WY_bYXGX^^BB 100 46.94 +XXXXXXXXXX:7:1101:2259:1943#/1 NTCTTCCTCATCTTCTTGTTCTTTTCTTTTTCCTTCTCCTTCTCCTTTTTCTTTTGTGACATGATTTCACTCTTGTTACCTACGCTGGAGAGCAGTGGTG BP\accc`b[QbKb`cd_``dedddcddYXecSbdI^P^XcSXbX^Y^^c^a^cc_HHXacIXWM\WWWa\HW_]NV\``_BBBBBBBBBBBBBBBBBBB 100 39.63 +XXXXXXXXXX:7:1101:3371:100179#/1 GGTTCTTCGAATGTGTGGTAGGGTGGGGGGCATCCATATAGTCACTCCAGGTTTATGGAGGGTTCTTCTACTATTAGGACTTTTCGCTTCGAAGCGAAGG abaeeeeegggggfgegheghii[eghiicaacccccccdccddccccccc`bbcccccccc[aacccbccdcddbccbccccccccccccccccc^aaa 100 65.77 +XXXXXXXXXX:7:1101:2371:1957#/1 NCCGTCGGAAATGGTGAAGGGAGACTCGAAGTACTCTGAGGCTTGGAGGAGGGGAAAATAGAGACCCAGTAAAATTGTAATAAGCAGTGCTTGAATTATT BP\cccccc^ggghbfdcghf^ecfghhhhhaffbgfd[egfcd_GWbfZcagU^N^`__ZZ_b^aaaa]]`bbc_RT]]b_b_SYXGJS_b]^bb`]_a 100 49.81 +XXXXXXXXXX:7:1101:3311:100186#/1 GAAGTGTCTGACTAAAGTCCGTTGCCCATTTTTTAATCAGGTTGTTCATTTTCTTACTGTTCAGTTTTAAGAGTTCTTTGTGTATTTTGTATGACAGTCC bbbeceeegggggiiihiiiihiiiiiiihiiiihhhhhhiefhhiihiiiiiiiihiiiiihhhghihhhffdddggggeedeeeedbdbddccccbcb 100 69.12 +XXXXXXXXXX:7:1101:2394:1961#/1 NCTGGAAGTGATGGTCCGGAACCGTTCCTGGCCCGCTGTGTCCCAGATCTGAAGTTTGATAGTTTTGCCATCCAGCTCGATGGTTCGGATCTTGAAGTCC BP\cceeeggeggifhiiiiihifhhihhffhiifgfffgfghihhhfhiihiigggefgeeceeeebbddbdcc`bcccccaY``aaacabcb[`bbcc 100 52.65 +XXXXXXXXXX:7:1101:3438:100192#/1 GGCGGATGAAGCAGATAGTGAGGAAAGTTGAGCCAATAATGACGTGAAGTCCGTGGAAGCCTGTGGCTACAAAAAATGTTGAGCCGTAGATGCCGTCGGA bbbeeeeegggggihiiifghhiihiighihiiiiihiiihihihiiiiiiiihiiifhhiefgggeeeedcdcc_acabbcccccacccbbbbcXa]a] 100 66.94 +XXXXXXXXXX:7:1101:2333:1962#/1 NGGTTGCTTGCGTGAGGAAATACTTGATGGCAGCTTCTGTGGAACGAGGGTTTATTTTTTTGGTTAGAACTGGAATAAAAGCTAGCATGTTTATTTCTAG BPYacccca]ee_c\egafbgfgghf]fhfdbg__a^efghaffcf`eghefhdghhdg^`[]a`bab]`bYb]b__bbbbabb__bcbbddbbbdbd`] 100 52.52 +XXXXXXXXXX:7:1101:3479:100209#/1 TAGAGGTGGGAACAAGAAAACATTGATATAGTTTTGAATTAACATTAAAGAGGCAAAATTTCACATTTAAAATGGCCCAAAATATCCCACTATTCATTTT abbeeeacgggggiiihiiiiiiiiiihiiiihihiiihiiiiiiiiiiiiiiighifgiiihiiiiiihiggggdgeeedcddeddccccccddddded 100 69.20 +XXXXXXXXXX:7:1101:2459:1990#/1 CGGGGAGGTAGCGATGAGAGTAATAGATAGGGCTCAGGCGTTTGTGTATGATATGTTTGCGGTTTCGATGATGTGGTCTTTGGAGTAGAAACCTGTGAGG a_beeeee`cggghiiiihhdfgfdhhiihiiihhiiihiffhifgefhifhhihfhggegeabcdaaddcdc`_`bcccccc[bbccccccccabbcb^ 100 66.80 +XXXXXXXXXX:7:1101:3417:100210#/1 CCTGGATATTGTTTTTTCTAATAATGCCTATCACAAAAATGTATAAATGCCTTCGTATCATACTTTTTTAAAAACAACTGTCAATAATGAAAACTGAATG aa_ceeeegggggiiiiiiiihiiigiiiiiibgghiiiiheffhiiihehiihighhhiihiiiiiiggggggeaabddbdbcddccccccccbc_bcc 100 68.25 +XXXXXXXXXX:7:1101:2372:1994#/1 GCGGTGATGGTAGCCTTTCTGCCCAGCGCGTGCCACAGAGAAGGCTACACGAGCAGGATGCCATGCCCCAATACAGGCCACCTTGCGCAGGCCTCGGTGG ___ecccceceeggggfhghiiifggfgfigghf_fdgdgiffffffhhhhaggeeecdbbZ`]bbcbcc_cccbccac^^^`bcccac[_X[_^acW^a 100 64.27 +XXXXXXXXXX:7:1101:3452:100214#/1 GAAAAGGATGGAGGCAAATTTTAGCAGCAACCTCCACCTGACTGCTTGACTGGAGTGCTCTGAATTTTAACATTGGACTTCTCAGCACCACCAGCTGTTG a__eeecagegffhhihiiiiifffhiiihhhfhihhihbggegbbffghihihibgg`gfhhhecffgggdgegedeeedcdcddccccccccccc]Y] 100 66.98 +XXXXXXXXXX:7:1101:2677:1830#/1 NTCATTTTGTTTAAAAACTCGCTTGTCCCAGATTTGGCTATGGTACCAAGGTTTTTAACCAACTCTTCTCTGGTCATTCCTACACCGGTGTCTGTGACAT BP\cceeeggggehhiiiiiiiiihfhhiihiiifffiiifhfeeghgiiicfhihhhhhihhffhhhhggedggceeeeeeccddcccccbbcbccccc 100 52.71 +XXXXXXXXXX:7:1101:3354:100219#/1 TCTGGCTCGTCTGAGGGCACGGATGTCCTTCCCAATGCCTCGTGTGAGTTGGTAAGTATTGCCAGCTAAGGAAAGAAAGTTGGATATGTTCTCACCCAAA aabeeeeefegeehhiiihiiiihfgfhggdgighhfdhdfdfg\e_eeghhhhhideggeggeeeeedcbZ`b^^`bb_`bcbbbbcZ_`cbdbcc[`_ 100 65.63 +XXXXXXXXXX:7:1101:2603:1846#/1 NTCCACTCCTAGGAGGTCCCCAGAGTCCTCAGATTCAGAGACAGAAAGGATGGGGGACGGGCACAGTGGCTCACGCCTGTACTCCCAGCACTTTGGGAGG BP\cceeeeggfghfhcegihihffeffdhihhiihhhhhghfhhfhhib`fgffh`geecccccbbc^_accb``_^``bb`]^`^`acc`bbY^]`aa 100 52.59 +XXXXXXXXXX:7:1101:3600:100019#/1 GGAGAGGTTAAAGGAGCCACTTATTAGTAATGTTGATAGTAGAATGATGGCTAGGGTGACTTCATATGAGATTGTTTGGGCTACTGCTCGCAGTGCGCCG aa_eeeeegggggiiihiiiiiiiihighihihhiiihifhhiiiiiiiiiiihiigiiiiiihhhhighfghggcggddgeeeedddcccccccccccc 100 69.05 +XXXXXXXXXX:7:1101:2535:1848#/1 NGTAGCGTACCAGCCCAGGATGAGCTCATTTGGAGAAACTTTTTTATGCAGTTCATACATATTCTTAGCAAATTCCATGTCAACAGCCACTTCATCTTCT BSYcceeegggggiiiiihghiifhhhiiiiiifhhihghihiiihihfhiiihiiihiiihhigggfgggeeeeeeecdddddcaccccccccdcbcdc 100 52.79
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r1_seqkit_fx2tab2.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,101 @@ +#id seq qual length avg.qual +XXXXXXXXXX:7:1101:1582:1835#/1 NGCTTCAGTTGGTACAGGTGTGTCACCCGTAGTTTGTAGGCTTGGAAGCCTGTAAGCTGTAGGGAACGTGGCAAGAACCAGATCTGGCCTTCCATATCTC BP\ccccc`eeccdeef_`fgabeghehdfhb^caefhee^efcehaeehhWabehddeM_eehhdeebd\^^a_]`___aaa`c]`Y^aaaaa_]]]aY 100 52.19 +XXXXXXXXXX:7:1101:1610:1859#/1 NTTATGTGTTACGTGAATCTCCTGAAGACAGCAGAAACTAGGTTGGTGAATTCTTATCCATTCTGCCATTCTGTATCTTTTAAGTGGAGCATTTAGGCTA BP\cceceggggggiihiiiiiiiiiiihihhiiihihiiiihiiihhiiihiiihhiiiihhiiiifhiiihgigggggggeeeeeecccddcdccbcc 100 52.73 +XXXXXXXXXX:7:1101:1743:1871#/1 NCGGGATGGAGGCAGGGCAAGCGGATGCAGGCCCAGCCCTGCCCTTACAGGTAGCTGGAAGTGACGAAGGAGTGGGGCCCCCGGACTCTGCTCAGGTGGA BP\ccceeggggghiiidfffhghfhhfffhhhidgggffbbghhheggeg`ccbccb_bdbdbbccaV^aaX^a`]X[_cca]]X]bc]Y]b`X`Y`_` 100 52.42 +XXXXXXXXXX:7:1101:1536:1878#/1 NGGCCTTTTTGGACAGGTGGTGTGTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGC BP\cccedggggbffhieghdbgdeghffffhih[aaefdhefhhihhiiidffdffhgbbagaeebbdcddb_bcccbR]YXT]_`ab``[^b^]bcbb 100 52.41 +XXXXXXXXXX:7:1101:2990:100153#/1 GCCAGGAGTGACTGTGTTGTTCTTTGCTTTATATACATAAGCGCATCTCTTGCCCAAATAGAATTCTGTTTCATCTCGGGCGTAAACACCTTCAATTTTA ___cccecaegceg[dgfhgfbgdfgfhhfhhdfedhffhhhhhh[fhbbd_S^aaegfg`dfhgghhbcgddd``geadcc_a_a_][_c]bccccbba 100 64.07 +XXXXXXXXXX:7:1101:1624:1906#/1 NCCAGGTTTAAGGCATTACATCGAGGGGCTGAACTTGAGACAGTCCCTGAAAATGTAAGAACAGGAGCTAGAACTTGCTTATGGGAAGGGCCTAGGGAGA BP\cceeegggggiiiiihiiiiiiiiiiiiiiiiihiihihhiiiiiiifhiihhihdbfhggggeeeeddbddbdccccccbcbccccccccccccc_ 100 52.70 +XXXXXXXXXX:7:1101:1666:1926#/1 NGCAAACTGGTCAGGACCTGGAGCTGCTTGCCTGGCCTTGGCACAAGAGGCCGACATATGCCCAGCCCCTAGGAGTGACAGATCCGTCCTCTGTGGGAAC BPaceeeegggggiiiiiiiiiiiiiiiiiiihihiiiiiihiiiiiiiiiiiiiiiggggggeeeeccccccbbcaccccccccccccccccccccabc 100 52.71 +XXXXXXXXXX:7:1101:2921:100163#/1 CTCCGGATGCCAAAGGATCTGACAGTGTATCTAGCTTTGGAAAACACAGGGGTCTGCCCTGTGAGCTGCTCCAACACCTTGGCTGCTCGCGTCAGTCTGT bbaeeeeegggggiiihihhhiiiigheegfhhgdhihhhhhihhfhhhhbgggghihhdggihggeggeeeeeeacccccbccccccccc_a__bbccc 100 67.82 +XXXXXXXXXX:7:1101:1513:1929#/1 NCACTATCAAGGTTAGTGTCTATATCTACTTGAGANAAAATACTGAAAATTCAGTGTATGAAGCCAAATCCTGATTTAACAAGTTATTGGTAGTATAAGT BPY`acccceeeY`bfefeggehe`gddgceh_eWBPYbedeehfdefhhh]fhehbffhh_eeehded`cfhhdheeeeeeeddccccac`b]]ZZa`T 100 49.64 +XXXXXXXXXX:7:1101:2759:100170#/1 CTGCTCATCACATTCCAGATGCCATCACAGGCAATGACCATGAATTCATGGTCGTCAGTGAGAGTCAGCACCTTGATGTCAGGAAGGGCTGAAATCATCT bbbeeeeegggggiiiiihiiiiiiiiiiiiiiiiiiiiiiiihiiihiiihiiiiiighhiiihiiiiiiigggggggeeeeeddcccccabccccccc 100 69.31 +XXXXXXXXXX:7:1101:1708:1937#/1 NGGTCGGTGTCCTTTTTTGGCGTCAAACTTATAGAGGGAAGCAGGGAATCTACCCAACCAAAGCCAATGAACAGTCAGTCAGTCCATCTAGTTAAGGTTC BP\accccecggghiihihifhihffhihf`fegfghf`\ebcefgiigdgeggdeeec`abcbcbbbcbccccc`bccbccb```bbcccccc`bb`bc 100 52.64 +XXXXXXXXXX:7:1101:2981:100211#/1 GGGGTCAGTGGGAAAGGTGTCAATGGGACTTCGGTCTCCATGCCGAAACACCAAAGTCACAAACTTCAACTCCTTGGCTAGTACACTTCGGTCTAGCCAG __beccceeeeggdhffghhhhiihhcghffhiefaghhhfffffffhhiigifhf\cdbdddeeeebcbbd_bb_^bcbaccbcbbbbaa^a_]b`b`a 100 66.08 +XXXXXXXXXX:7:1101:1688:1946#/1 NCCGCCTTCTTTCTCTACTTCGTGACCTTTTGTGGTCCCGAGACCTGCTGCATCTTCTGTCTGATGTTCGGCTTGAGTGTCTACTTCCTGAACGACTTCT BPYac``c[cccchdd]caddeddehhhhhd`cdb^b]cc[^c_^_acccddchdhdcd\bdd]bd^bbbU\^BBBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.51 +XXXXXXXXXX:7:1101:2767:100225#/1 CGCCTGGTGTCAATGCGCACATCTGGAGTTCCCATCTCCTTCATGGCAAATTTCCGAATCTCTTTGAGTGCCCGAGGTGCACGCTTCTTGAAGCCCACTC ___eceeefgggeiihihhhhihihihfgac_cefffihehiiiihhhhhfghhfhiehiihihf_ddbbgddcb`c]`bbbccccc`bb`b_bcccccc 100 66.85 +XXXXXXXXXX:7:1101:1536:1959#/1 NGATACTGTTGGGTCAGGACCAGGGCCTGCACCACCGAAATTCTGTCTTTTACAAACTGGACCAAGCGGTTGAGAATACAGGGGCCGAAGAGTAGGATTA BSYaa^ccggcg`d^dba_\ffh\[Zbf_aZ[c_cfY_ee`aeaf[\eefeghhffg_]\\`db^cdb`[ZWZR[`b]bbbbWELT]__TX^SYY]]]bb 100 50.36 +XXXXXXXXXX:7:1101:2797:100234#/1 GTGCTGGTCTCTCTCCACGATCTCTTACGTGCTAGCAGGGTGAACAAGGACGCCTCGCTGTCATTGCACTCACGCCACAGGAGCCTGGCACATTTCCGCT JY^accWceeeaWdcZ_feW`R^eg^a[HPP^_ef[d[Z_eUQX^ae_^Q\`ZSbUadVLKV_Z_Z_`]Z_baa^\WW^TGXTXWR^GW[][``BBBBBB 100 44.12 +XXXXXXXXXX:7:1101:1552:1976#/1 NTGATGAGTTTGCTAATACAATGCCAGTCAGGCCACCTACGGTGAAAAGAAAGATGAATCCTAGGGCTCAGAGCACTGCAGCAGATCATTTCATATTGCT BP\cceeeegegfiiiihiiiiiiiiiiihhiefgfhhhihifghdhhiiighfhhifihhiiiaghhigggggcdebdbddddcccccdedddddddcc 100 52.72 +XXXXXXXXXX:7:1101:1748:1978#/1 NCGCTGAGCAGGGCAGGCAGTGGTGGAGGCAGCCCCCCAAGACCCCATCTCTATCACAGTGAGAGCATCTGAACTCCAAAGCCACGACAGAACAGCTCCC BP\ceeeeggggghiiiihihiiegihhihiifiihhi`gfffggggeeeeeeddcdbd_bccbcccbccc`bbbbccccbccccccccaccbbb_`bcc 100 52.66 +XXXXXXXXXX:7:1101:2779:100239#/1 TGGGTGCTCTCCTTGGTCAGCTGCTGCTCGAACAGAGCACTTCTAGATACAGAGTTGGACCCAGACACAGCAGGGGTGGCCATGGCGGCTGGGAAAGACC ___^cc^ceggeeghddghafhXbegefbaYYbfhfgf_ae[egegc_cccaacaefg[bZbZ\\ZbZZ^gZZ^[]WW\_^bBBBBBBBBBBBBBBBBBB 100 40.42 +XXXXXXXXXX:7:1101:1593:1980#/1 NGGCACCAGAAGCATGAGCATAGGCAGAGCCATTTCCACCATGCTGACGGCAGGCAAGAAGAAGACAAAAATGAACCCCTTTCATGCTTGTTTAGAAATG BP\ceeeeggggfiiiiiiiihiihiiihfihhiiiifhhhiiiiihhiiiiiihhigggggeeeeeddcccccccccccccccdcccdccccccccccc 100 52.71 +XXXXXXXXXX:7:1101:2946:100242#/1 TGGGGATGTTGTTAAAAAAAATACAGGCTCCCCCACAACTGGGGTGCCTGGGGGGAACTTGGTCTGCTTCAGCCCAAGAGGAATCAAAAGATCAAAAGCA ___eecccgggggihhfhihfdfhhiihhiifiiddbcd`\eghL\^a^bdccccTTWRY`bRYYXSYb``bbca`acW^a`^bbccccc_bb`bbcbac 100 58.29 +XXXXXXXXXX:7:1101:1987:1781#/1 NTTAGCAGGTCCTCGTAGCGTTTCCGCAACTCTCGGAATCTGGAGTCTTCGGAGTGCAACTCTGAGGGTCCCGGGAAACTTGCGCGGCTCGCCTCGGCCA BP\cceeegggggiiiiihiiiihiiiiiiiiiiiiiiifiiiihhghiiihiggfgeeeeeebddcccccccccaccccccccccccccaacccXa^a[ 100 52.65 +XXXXXXXXXX:7:1101:3046:100006#/1 CTGTACAGCATGGATGTGGACAGGGAAAACAGCAAGTGCACACAGTGGGACAGGCCACAGGACAGGCTGGGAGTGAATAAAGAGTTCACACTGCTTCCCT bbbeeeeegggggiiihiiiiiiiiiiiiiiihiiieghiihhihffghiiiiiihiihhiiiggggeeec\bZ^bcbccc_]^]_b`bc`bbccbcccc 100 66.70 +XXXXXXXXXX:7:1101:1900:1788#/1 NCCCGCTGCCCACGCCACTGTCCCGGCGCTGCCCTGGGCGCGGAATGCGCGTTAGGCAATCCCCGGTCTGCGCGTCCCACACGCAGATGTGGCCTGCCAG BP\ceeeefggfgiiihiihiiiifhhiiihhiihiiihgeecccccccccaccccccccccccac_accca]aa[aacccccccccccdbccaccccb_ 100 52.64 +XXXXXXXXXX:7:1101:3214:100027#/1 GGCTGAGGTACTGAATGAGGAACAGCAGGAGGTAACGTCTGAGGGTGCGGCTGGGGAACGGTTTGCACAGGGGTGGCTGTAGGAGCAGGAGGTGAAACAC ___eecee^cegghhhhhhfhhfgfhhfhhhh^eggfcefhffhbU^eghhehgggTXZ\aTTX\RRYTT[GWROTWW[GG]YGXW[baOQEQW]b`]XW 100 49.49 +XXXXXXXXXX:7:1101:1848:1879#/1 NCTTCTTCTTCCTCATGTTTTTTGATCAACTGCTCCACTTCTTTTTGTTTGAGAACTCTGATTACTGTCTTTCCATTCTCTCTTGTTAGTGTTGCAATTT BP\cceeegggggiiiiiiiiiihhihhiehfhihhhiiihiiiihfghihdggfhhiiihihh_ddcggeefdb`beeeeeddcddbdbbcc`bbcccc 100 52.70 +XXXXXXXXXX:7:1101:3237:100032#/1 CTCCCGAAGTGCTGGAATTACAGGCATGAGCCCCCACGCCTGGCCTGATCAAGCTGTTTCTCTTGCTTGGAATGCCCTTTGCTGCCTGGCCAGCTCCTAG _b_eeeeegegggiiiiiihiiffegfhhihiiiiiighiffhiiiiiiiiihhiibdeggggeeeeeebcbdbcbcccccccccccccccccccccccb 100 67.87 +XXXXXXXXXX:7:1101:3027:100049#/1 CACAGAAACACGGGTTCATGATGGTGAATGATATAGCGGGTGACAGATGGCTACAAACCAGTCATAGGCCATCACACTCAGGAGCATGTCTCTCTTCCAT bbbeeeeegggggidghiihhihidgfhiihihfiiiiii_eghiiiihihhiiiggggeebdddcddddcccccbbcccccccccccbbdccccccbbc 100 67.75 +XXXXXXXXXX:7:1101:1756:1891#/1 NCGATGTTGAAGCCTGAGACTAGTTCGGACTCCCCTTCGGCAAGGTCGAAGGGGGTTCGGTTGGTCTCTGCTAGTGTGGAGATAAATCATATTATGGCCA BP\cceeegggggiiiiihiiiihiiiiiiiiiiiiiiiiiiiiigiiegghige]_ccaaccc_bbbbcccccc_bbcbcbccccdccccddddccccc 100 52.67 +XXXXXXXXXX:7:1101:3238:100065#/1 GGATGATAGAGTGTGGGAGAGAAAAGGGAGAGAGACTTTGGAGCTGAGTGGGGACCGCCGGGGAGGGGAGGCCTCAGAGTGGCTCAGCTGTAGATGCGGC bb_eeeeegggggdfgifhghhiiiiiihghhfgdhihiiifhhiiiigghiiiiigeecccc_accc_ccccbcbbbc_bccccbcbcc_bccdcbcca 100 67.15 +XXXXXXXXXX:7:1101:1915:1901#/1 NTAGAGGCTTACTAGAAGTGTGAAAACGTAGGCTTGGATTAAGGCGACAGCGATTTCTAGGATAGTCAGTAGAATTAGAATTGTGAAGATGATAAGTATA BPY`cceegfggfihgghhhegfghfgihdfhhhhhhfeffdgighiiiiifhiifdgdgecddc_cbbbdbbdcb__`bcc__`_`bbcbbccccac`c 100 52.64 +XXXXXXXXXX:7:1101:3198:100082#/1 CCCCCGCTCAACTACAAATGTCAATATTGAATGAAGCATTAAAAGACAAACATAAAGTAACTTCAGCTTTTATCTAGCAATGCAGAATGAATACTAAAAT b__eeeeeggggfiiiiiiieghhffhfhiiiiiifhiiiiiihgfhhiiiiiiiiigghhihiiiifegfggeeeeededcdcddcccccddcccbbcd 100 68.63 +XXXXXXXXXX:7:1101:1964:1931#/1 NGGGGTCTTAGCTTTGGTTCTCCTTGCAAAGTTATTTCTAGTTAATTCATTATGCAGAAGGTATAGGGGTTAGTCCTTGCTATATTATGCTTGGTTATAA BP\`Z`cdggggfhhhhghfghhhhhhhhhhffhhhhhhhhdggfhhhhhhhhghhhfgfceghfhhhhdgdgdggbggfgfebdeeeedcddbbccccc 100 52.70 +XXXXXXXXXX:7:1101:3088:100091#/1 TCCCACGTTTCCCACTTTAAAACAGAAGACTGCAGAGGATGTGGTAGAGACTGCAACTGCCAATGTAGCATCCGTTTTCCCAATTTCTCAGTAACAGGAT bbbeeeecgggggiiiiiiiiihffhihiiiiifgdghbghggighhhihhiiihiiiihiiiiihiiiiggggebcecdcbddcccdcdbccccccc`b 100 68.56 +XXXXXXXXXX:7:1101:1840:1948#/1 NCAGGGTGAGGGGCTTCGTCTGCTGGATGTACTTGTTGCCGAACTGAGTGACCCCCCGGGGCCAGCCGGTCTGCGAGCGATTGGGCGGTACCACAGACAT BP\ceecegggggiiihhhhiiiiiighhfhhiifhiiiiiiiiiiiihiiifhhgccccccacccccccccccccccccccccccccacaccccccccc 100 52.69 +XXXXXXXXXX:7:1101:3105:100094#/1 GGGAACTCCAGGGATGAACATGAGAAGGCCCTTCTGCTGTAGTACTAACTGCAATCAGTGTCTCGGGCTTCATGGGCTTGGCTTTACGTAACAAGCCAGG ^[[^ccccc^eccgf\R`bggfffbffhhfhbXc]Xcfcg]ece_cegfadafhgfheNWW\_]eZFZW`^HVZ]UZ`ZKZGT\b_b[KYXGY_XQWbW^ 100 50.33 +XXXXXXXXXX:7:1101:1958:1952#/1 NTCATGGTAGGGGTAAAAGGAGGGCAATTTCTAGATCAAATAATAAGAAGGTAATAGCTACTAAGAAGAATTTTATGGAGAAAGGGACGCGGGCGGGGGA BPY`cccc^aaecf`e[dbeeedaaeVefhhhdeXc_fehdb_eedhhhed\acbefdhdddee`bbeeeeeacca]_aa__]]_aaaaaa]aaa_]XaT 100 52.40 +XXXXXXXXXX:7:1101:3190:100106#/1 CACGGTTAGGGTACCGCGGCCGTTAAACATGTGTCACTGGGCAGGCGGTGCCTCTAATACTGGTGATGCTAGAGGTGATGTTTTTGGTAAACAGGCGGGG bbbeeceegggggiihhhihifhiihiiiiifgeghihhhhhfhgfecR]_bcccccdcccdc]b]bbccccbccc^`bc_bcccaccccccccacccac 100 64.50 +XXXXXXXXXX:7:1101:1993:1999#/1 GTTTAATTGTGGGAGGCTGAGAGCAGCATTTTTACCAAATTGGTGTAAAAATGAAACGGGGTCCAGACGTGTACACTGACAGTTACAGTAAATTTCAAAA bbbeeeeegecgfdhhiiihihiiiiiiiihiighihhfhihhcf_ehhhiiiiihihhggadgggeeeccddddbccccccccccccedccecccdccc 100 68.03 +XXXXXXXXXX:7:1101:3117:100110#/1 GTTTTATGTTGTTAATGTGGTGGGTGAGTGAGCCCCATTGTGTTGTGGTAAATATGTAGAGGGAGTATAGGGCTGTGACTAGTATGTTGAGTCCTGTAAG ___eeeeeggggfiiiigihghiibfcgefdgfhii`ghiefefhghhaedghdhibfghfhiff^`gbggeeeedbcbdbbbccdedcccbbbcbbbcb 100 67.19 +XXXXXXXXXX:7:1101:2159:1798#/1 NCTTCCAGTCCCCTCCTCGATTTCACACCGGGACACACACCTGGGTCAGGTGAGCATGACACACAGCCCCCAGGATGGGCACCCCACCCTGCAGAGCAGA BP\ceeeegggggiiiiiiiiiihiiiiiiiihhiiiifiiiiiifgiiiggggggeeeeeddccccaccccccccccccccccccccccccccbccccb 100 52.69 +XXXXXXXXXX:7:1101:3147:100111#/1 AGAAATTATTTTTAAATGTCAGAGAGAATGCTATTATTGGCCAACTTGAAATTTCCTAATTAGCTATCTGAGCTATTTAAGTCTGTACTTCAGTGTCTTC bbbeeeeegggggiiiiifiiiiiiiiiiiiihhiiiihhiiiiiiiiiiiiiiiihigiiiiiiiiiiiihihfcghhihbggggfgeeeeea_bdddd 100 69.60 +XXXXXXXXXX:7:1101:2152:1838#/1 NGGGAAACGCCATATCGGGGGCACCGATTATTAGGGGAACTAGTCAGTTGCCAAAGCCTCCGATTATGATGGGTATTACTATGAAGAAGATTATTACAAA BP\cceeegggggiiiiiiiiiiiiighigggggeeecccdccccdcceccccccccccccccccccccdccc^bbccccddccdcccccbcccddcccc 100 52.66 +XXXXXXXXXX:7:1101:3065:100152#/1 CACATAGTCAGCCTGCTTGATCACGTCGATCTTGTCCAGGAAGTACTGGGCACAGTCAATCAGCTGGTACTCGTTGGAGCGTTCGTAGCAGGCACGCACT ___ecacccggcgfhhhhhhh_gfdeghhhhhhhfhhdcdhXfX^f_eghhfUegbfh_be__dhbb`g`bga_aZ^]bdaX\^a^`aa`_[_aW]][]a 100 62.63 +XXXXXXXXXX:7:1101:2180:1843#/1 NTAGGGTGTAGCCTGAGAATAGGGGAAATCAGTGAATGAAGCCTCCTATGATGGCAAATACAGCTCCTATTGATAGGACATAGTGGAAGTGGGCTACAAC BP\cceecgggfehiehihhihhhhdffhihifdhhifghhhiiihihihiiihiiiiihiiihfhiffefgfdegeecac`d]bddbb_bcaacccccc 100 52.70 +XXXXXXXXXX:7:1101:3154:100159#/1 GTTTCATCATGTTGGCCAGGATGGTCTCAATCTCTTGACCTCGTGATCAGCCTGCCTTGGCCTCCCAAAGTACTGGGATTATAGGCGTGAGCCACCGCGT bbbeeeeegggggiiiiiiigiiiggiiiiififhiggiiiiifhiiiighiiiiiiiiihiiiiihhffffgggdgeeeeeedbdcaccaccccccaca 100 68.83 +XXXXXXXXXX:7:1101:2125:1861#/1 NGTGGGAGCAGCTGGCTGTGTGGCACCTGCTGTGGTGGCTGCTGGCGTGGCCGGAGTGAAGGGCAACGTGGCAGGTGCCGGGGGCTGGGCTGGATTCCCT BS\cceeegggggiiiiighghihfhifhhihfgfeghfbffgffaf_efffegX]Z]]_bccPZ^`aX`a]`acBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.83 +XXXXXXXXXX:7:1101:3198:100173#/1 TGGCAGGTGGTGGTGGTGCTCAAAGAGCAGGTCCAGGTGGAAAGTGAGCACCGACAATGGCTGCAGCAGGAGCAGCAGCTCTGTGGACAGGGAGGGACAA ___cccccece`gbZaffgadfgg_ddffghbafffdaffffhhedghhhhhffhgggadc_`bbbba^a\\XXT^[^[Y_]`Y]b]`b__aaBBBBBBB 100 44.48 +XXXXXXXXXX:7:1101:2076:1911#/1 NGGAGTAGGAGTACCCAGTCTCTAGTGCCAGCTGCAAGCGTTAATTTGGTTAAAGTCTCCTTGATTGTCCTGTTCATTCTTTCTACCTGACCTGAACTCT BS\ceeeegggggiihiiiiihiihgiiihiiiiiiiihhhihghiiiihhiiiihihiihiihiiihhiiihfggggggeeeeabcdbdddcccccccc 100 52.81 +XXXXXXXXXX:7:1101:3166:100190#/1 CCGGCCGAAATTGTTTTTTAAATTTACGTGTCACCCTTCATGCAGGGCCCTGCTACTCTTCGTAGCCCTCCTCCATGTTTAGTGTGGGTGCGGCTGCAGC bbbeeeeeffgegdgigfiihhiiihiifggghffc`gfffgheifffagdbddgdbeced`bdcaccbaccccb`b`bccbY`bccaX]_accaa^R^b 100 63.87 +XXXXXXXXXX:7:1101:2196:1920#/1 NTGGGGTGGGTATGGCGGGGCCAGCCTTGCTCAGTGCTGTGGTGATGGCCACAGTAGCCTCGGGGGGCACAGCCACGGCTGGGGGAGCAGGCCCTTCCTT BP\ccc`ceeceehhhhhhh[aZZZ^U]LZ]]ZTZ_]]TTY_KTT]]`[a]_[[R]]R__aR[aaaaTEW^XP[GRLTTOOXaaBBBBBBBBBBBBBBBB 100 40.29 +XXXXXXXXXX:7:1101:3225:100207#/1 GCTATTTTCTGCTAGGGGGTGGAAGCGGATGAGTAAGAAGATTCCTGCTACAACTATAGTGCTTGAGTGGAGTAGGGCTGAGACTGGGGTGGGGCCTTCT bbbeeeeeggfgghiiihiYcghiihiihiififhfghfhhhhhhggggggeeeeeddddddcdcac]`ababbbbacccccccbcccc[aaacaccccc 100 66.30 +XXXXXXXXXX:7:1101:2115:1927#/1 NCTCCTTCTTGGCCTGGAGGCGCTCTTCACGGCGCTTGCGTGCTTCCTTGGTCTTAGACCTGCGGGCCTCAGCCTGGTCAGCCAGGAGCTTCTTGCGGGC BS\ccecegeeggiiiffggfhhiiiihhdhihfdghddfggeeeeecdddZ]bcdcbcccbccacaaccccccc^`YYYX`bW`_`a[`_b``_baccT 100 52.51 +XXXXXXXXXX:7:1101:3019:100219#/1 GGCGGGTTTTAGGGGCTCTTTGGTGAAGAGTTTTATGGCGTCAGCGAAGGGTTGTAGTAGCCCGTAGGGGCCTACAACGTTGGGGCCTTTGCGTAGTTGT _[^ccc_cggccgghdgcbgdf_WcXae[cbefffgbefh_d`dgddb]aaZTZW__cc`bb]ZZ_^aaZ]a^`b_Y__ab[`_XT_^bbbbaBBBBBBB 100 44.46 +XXXXXXXXXX:7:1101:2179:1937#/1 NAGGAATACATATAGTCATCATTGCCAGACTTAATATGAGAGGTGAAATGTTCGATCCAATTTTCCTTCCTGGATAAGTTTTTCTTTCCTATCCCTCTCA BP\cceeeggggghigfghiiiiiiihiiiiiiiiiiifhhhheghhiihhhihiiiiiiiiifhghhiiiiihhgffdgfgegeeeeeeeddcddcccb 100 52.73 +XXXXXXXXXX:7:1101:3202:100230#/1 CTGAAAAACAAAACAAAACTTAGCTAAGTTTTATGGCAAGTGGGGGCAGGGTCAGGTGAAGAGGTAGGAATTGCCTGAGGTTGGGGGTCCCTAAAACATA __aeeeeegggggihhhiiiiihihhhhfghhhihhhiihfffgdfhhihiddggeceeeeedcbbdcbbbcbcc]bbcc^abccccT[acbbcccb^`b 100 65.28 +XXXXXXXXXX:7:1101:2149:1945#/1 NGTGTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGCCTAGTATGAGGAGCGTTATG BPYaccccegggghhhceghghhhhhhhhhfhhhhhhhhhhhhhffhghhhdffghghhbfghgfddgddcdddbebcbbbbbbbdcdbbbbaaaaaaab 100 52.67 +XXXXXXXXXX:7:1101:3211:100242#/1 CTGTTCCCCAATACCTGCAATTCACAGATATAATTTAGCATTTTTGTTTTTATATACTAATTTAGGCAAAACCCCCCCGCCACTGAATCGTCCAACAAAA ___`acacgggcghfdddc_gbggghddgfgfhhccdab[e[_Xbe^^cacdfgbaa[caSWWbfbf`efc_Zbg[XZaccaacccbcc[[WW^bbW[[a 100 61.18 +XXXXXXXXXX:7:1101:2169:1964#/1 NGGGAGCAAAAAGCGTGGGTACAGAAGCGAGAAGCGAGCTGAGTGGTTAGTTCAAATCAAGGCTTGGGGTATTTCCTGGTCATTTGGGGAACCTGAAACT BP\ccceeggggfehfhhh_fhifbgf[effhh`cfV__`gefccg`ddg`d`beeeadddbcccaaacNWY_bZ]`bb_YY__aGSTXGTW^R^R_b_` 100 50.12 +XXXXXXXXXX:7:1101:3168:100244#/1 CCCTTCCTGTGTCCATGTGATCTCATTGTTCAATTCCCACCTATGAGTGAGAATATGCGGTGTTTGGTTTTTTGTCCTTGCGATAGTTTACTGAGAATGA ___eeeeegegeghiihfbgghhhhfhaggiiiidbfhfhfbdegdfcffgdgfhhfhhfceefghicfffeeceddbddba^acc_bccccc[bbbcc_ 100 66.77 +XXXXXXXXXX:7:1101:3005:100246#/1 CAAAAGTTAAATGAAAAACCACAAGTTTAGTTTGACTCCGTCTCCTAGGGTGGATTTCATTCAGATATTTGTTCCATATTATAGGAGGGTGGATCCTAGC bbbeeeeegggggihhhihihiiiiiiiiihhihhhihiighiiiiihii^efaegfffhhfhhhiihhiidgggggdeeeeeeedccaZ\_accccccc 100 67.69 +XXXXXXXXXX:7:1101:2313:1789#/1 NTGCGCCTGGAAGCCGCCAGGCCGCAGCGCGGGGAACAGGGCGGCCACCCGGCTCAGCAGCCGCTCGCAGGGTCCCGGACCCGCCGCAGCCTCGGCTTCC BP\cceeegggggiihiiiiiihiihiiifhheccccccaccccccaccccccccccbcccccc_a]Zaaccbb`aaacaccaccccaaacccX]^^abc 100 52.58 +XXXXXXXXXX:7:1101:3253:100014#/1 GCGGATGATTCAGCCATAATTTACGTCTCGAGTGATGTGGGCGATTGATGAAAAGGCGGTTGAGGCGTCTGGTGAGTAGTGCATGGCTAGGAATAGTCCT bbbeceeegggggiiihihiiiiiiigfhiafbeccb_fdgaffhhhhhihihihhiieT]abcccccccccbb_WY]_bbbbccccccccbcbb`Y`bb 100 64.18 +XXXXXXXXXX:7:1101:2361:1794#/1 NGTTAGGCTCTCCACGACTGAGCTGGTCTCGGCACCAAGGGGGTCAGATTGCTTAAAGGCAAGGAGTTCAGGACCAGCCTGGGCAATGTGGGGAGACCTC BPYacceeegggfhhhhfhhfhhb_eaefdgghhfgfffgbfcfdeggfgeeeeeddbd\``aaabbbbdbbbb^[[^aba_aababb`_Y[aaaR[a`b 100 52.45 +XXXXXXXXXX:7:1101:2337:1794#/1 NGGGAAGGTGTCTGTCATCGTCCCCAGGAGGGAGGTGGCGTTAGCTGTTTGTCCTGTCATTAGGTTGGTAACTCTCCAAGTAACATTGAAGATCTGGTGA BP\c`ceceggggiihiiihiffffghi`ghhggi^ce`f_faghihbghigegdgR_ceeeeeU]`c^`_bcbbccbbb]`bcbcb`b`cbbbc_bbcc 100 52.47 +XXXXXXXXXX:7:1101:3284:100039#/1 TTGGGCGACAAGGACATGGAGCTGGAGGAGAGCGTGGAGGAGCGGCTGTTGAGTTCAGAGCCCGAGTCCACTGCCACCGAGGCCGGGCTGGCGGCCAGGG bbbeeeeegggggiihiiiiiiiiihhihiffhifhiihhifhigeec`db`bbccdcccbcccccacccccccc`bcc_acacccccccca_a[_BBBB 100 46.93 +XXXXXXXXXX:7:1101:2477:1795#/1 NGGCGGTGCACCGAGCTGGAGGCTGCCGCAGAGGAGGCGGCCGCCGCTGCGGCCATGTACGTGTAGGGGTAAGGGAACAGGCTTCCGAAAGGGGACATGG BP\ccccefeeggffghffhhihhhhhfifhhiidghfddcca_aWaWac_accabccdcaX`R^bba_X_bcccW`^acc_^[X`_[[[a_acacc]][ 100 52.30 +XXXXXXXXXX:7:1101:3310:100056#/1 GGGCGATTGATGAAAAGGCGGTTGAGGCGTCTGGTGAGTAGTGCATGGCTAGGAATAGTCCTGTGGTGATTTGGAGGATCAGGCAGGCGCCAAGGAGTGA bbbeeeeegffgfiihiihiighiiihiihhiii\edgfhiddggeggeeeedbddcdbdcccbbc^a`bcdccb`aabbaccb^acccacccca`cX`b 100 65.89 +XXXXXXXXXX:7:1101:2355:1821#/1 NTGTATTGAAGCCAAATTTCGTGCCAGGGTGGTGTTAGAATGTGAGCTATTTTCATTATATTTGGACTAGAATTTTTTCTTTTAGGAGAATGGTGGGGAA BS\cceeegggggiiiiiiihfgiihhii^egbffhfhfhhiehhhiihiiiiifgh`ffghiiighfhhgggfgggcdddddcbbbc`abcc_bcccac 100 52.78 +XXXXXXXXXX:7:1101:3420:100060#/1 GTGAAAAATGTTTAATTTACTTCAAAAATATCTTGCATAAGTATCTCATCCCTAAGCTCAAACAAACAAGAAAATTAAAGGCGGAAAGAATACATAAAAT ab_eeeeeggffgihhhihgfdhhhhihf]ghiihefhhig^fgbghbfdhhiihbffhhiihiiihhhhhcfhigfhdg`dFXZaccbcbcccddcbcc 100 56.56 +XXXXXXXXXX:7:1101:2418:1834#/1 NCGGTTTCAGTCGTCACTGCTGCCCCAGCCTTTCGCTGTCCTTCTTGCAAAAAGCTGCTCCCATCGGTATACCAGGTGTGGTCGGCGTCTGGGATGGGCT BPYcaceeggggfiiiiiiiihifiiihiiiiihdfhhfhfhiiiiihiihhhhhihihhiiegggeeecbeddcabbbcccccccc[aaccc`bccacc 100 52.67 +XXXXXXXXXX:7:1101:3267:100061#/1 CTGGGTAGTTCTGGCTCCGGGTCTCTCATGAGGTTGCAGTCACGATATTGGTTGGAGTTGCAGCCATCAGAAGGCTAGACTGCGTGTGAAAGACTCACTT _bbeeccegggggiiiiiihigghihifhiiiiffhiiihhihidghiihheghhhighgggfeeeeeeccddcccccccccccaacccdcccccccccc 100 68.01 +XXXXXXXXXX:7:1101:2378:1838#/1 NGCCCAACCAACAGCTTCAACAGCTATTGCAAGGTGCGCCAAAGGCATCTTGTCATCCCTCACACGAATCTCACTTCCTGTGAATTTGCAGGGAGGCAGA BP\ceeeegggggiiiihiiiiiiiiiiiiiiihfhiihiiiiiiiiiiiiiiiiiiiiiiggggeeebcddccccccccccddddcccdcccccccccc 100 52.71 +XXXXXXXXXX:7:1101:3416:100083#/1 GCCCAGTCCTGGGGGCAGGGGAGAAAGGGAGGGGTGAAATGAGAAGAGCCCCGTTCTTCCTCAGTGCTGGGGGGTTGGAGACACCACCCCCTTCTGCTGC ab_eeeeeggggfiiiiiiiighghhiiihhhiiL\bgeeeeeeddbddcccc^acacccccccbccccccccc]X_abcbcccaccacccccccccccc 100 61.17 +XXXXXXXXXX:7:1101:2481:1853#/1 NGCAGGTAGAGGCTTACTAGAAGTGTGAAAACGTAGGCTTGGATTAAGGCGACAGCGATTTCTAGGATAGTCAGTAGAATTAGAATTGTGAAGATGATAA BS\cceccgggggiiiiiiihiihhfhhihiiifhgiiiiiihiiiiiiiiiiiiiieggeeeeeebdddbddccbbccccccbbbccbcbcccccccdb 100 52.78 +XXXXXXXXXX:7:1101:3411:100111#/1 GTGGTGGCCTTGGTATGTGCTTTCTCGTGTTACATCGCGCCATCATTGGTATATGGTTAGTGTGTTGGTTAGTAGGCCTAGTATGAGGAGCGTTATGGAG babeeeeegggggghiihiiiiiiiihdfgiiiiiifiiiiiiihiiiiefhhiiiegfhggghgggfbddeceeedbdbb_bedcccccccccccccba 100 68.20 +XXXXXXXXXX:7:1101:3258:100128#/1 GCTGTGGCTTTTTTAAGGATAACTACCTTGGGGGCCTTTTCATTGTTTTCCAACTCCGGGATCTGGTCACGCAGGGCAAAAAAGCTCCGTTTTAGCTCGT _b_ecceeggggfihghifffhhfghidghhiihighiihighiighhiifdffggggeecccccbccbccccca[_aaccccccbbbcacbcbbcccc[ 100 66.63 +XXXXXXXXXX:7:1101:2252:1856#/1 NCAGAAATATGGCAGTGCCACAGAGAGTGTGTCCTCATTGGAGTACTTGCGCTTAAATTCATCCAACACAAAGGTACTCTTGGGCAGGTGAGCGAAGGGG BPYcaccce^ecc^e`begg_a_fXQ`[Q_eb_b`d]ee^[ac^e^e[cbe^edeedVWW_bb\_\dd`bdGV^aaab``UUG\\\]_T_]aaaZO[T]a 100 50.04 +XXXXXXXXXX:7:1101:3428:100129#/1 GTTGGAGTGTAGGATAAATCATGCTAAGGCGAGGATGAAACCGATATCGCCGATACGGTTGTATAGGATTGCTTGAATGGCTGCTGTGTTGGCATCTGCT ___eeac\cecggfhhihihfhhiiiihiiihfhffihhhhihhidg`fgfgeeccccZ^^\]bbbc_bb`bbccabcbb`ba[]`YbS]Q[RSRX`bb_ 100 60.12 +XXXXXXXXXX:7:1101:2394:1871#/1 NTTTATTTCTAGGCCTACTCAGGTAAAAAATCAGTGCGAGCTTAGCGCTGTGATGAGTGTGCCTGCAAAGATGGTAGAGTAGATGACGGGTTGGGCCAGG BP\ceeeegggggiiiiiiiiiigghiiiiiiiigihihhiiiiiiiihighiiiiihgeggggeeeeedddddb_bccbcccdcccccc_ccccccccc 100 52.70 +XXXXXXXXXX:7:1101:3387:100138#/1 TTGAGGGAGGGCAGACACAGGCTGAGGAGAGTGGATAGGAGCAGGAGAACCTGCCACACCCCACACCCCACTGAGAGCTCATCAGCTGCAGCCCTGGGCC bbbeeeeegggggiiiiiiiiPdgfhihhfgXafffhfhhhiiiicfgifhhhegegceeccccccccc_aacc``__cccccbbcccc`bcccc`accc 100 63.66 +XXXXXXXXXX:7:1101:2269:1904#/1 NGCACCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCACTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCCAGGGTCAGGCCATTGCACTCC BPY`cceceaga^dadghhhgfhhbfghhhhhhhhfhgad`ec[ecedbbbecbdghgaaXKU^GZ\GTX`bRY]__bbT^aaRRWbb^a^]bbbbbb^` 100 49.98 +XXXXXXXXXX:7:1101:3444:100163#/1 TGTGGCTGTTCTATGAACCACCTTCTTCTTTCTGCGAGCAGTTCCTTTCCCACCAATGCGCACTTGTGCCTGCAGTTTGGCGAGGTTTTCCTGGGTCATG __\c\cc`^`c^be``bad`ddegaX`dgegfaIXW^^OW^O^ce]a^ae^egffgd_VZ_FT\ZV_]c`bb_bX]Z]R^baQREHW`WY_bYXGX^^BB 100 46.94 +XXXXXXXXXX:7:1101:2259:1943#/1 NTCTTCCTCATCTTCTTGTTCTTTTCTTTTTCCTTCTCCTTCTCCTTTTTCTTTTGTGACATGATTTCACTCTTGTTACCTACGCTGGAGAGCAGTGGTG BP\accc`b[QbKb`cd_``dedddcddYXecSbdI^P^XcSXbX^Y^^c^a^cc_HHXacIXWM\WWWa\HW_]NV\``_BBBBBBBBBBBBBBBBBBB 100 39.63 +XXXXXXXXXX:7:1101:3371:100179#/1 GGTTCTTCGAATGTGTGGTAGGGTGGGGGGCATCCATATAGTCACTCCAGGTTTATGGAGGGTTCTTCTACTATTAGGACTTTTCGCTTCGAAGCGAAGG abaeeeeegggggfgegheghii[eghiicaacccccccdccddccccccc`bbcccccccc[aacccbccdcddbccbccccccccccccccccc^aaa 100 65.77 +XXXXXXXXXX:7:1101:2371:1957#/1 NCCGTCGGAAATGGTGAAGGGAGACTCGAAGTACTCTGAGGCTTGGAGGAGGGGAAAATAGAGACCCAGTAAAATTGTAATAAGCAGTGCTTGAATTATT BP\cccccc^ggghbfdcghf^ecfghhhhhaffbgfd[egfcd_GWbfZcagU^N^`__ZZ_b^aaaa]]`bbc_RT]]b_b_SYXGJS_b]^bb`]_a 100 49.81 +XXXXXXXXXX:7:1101:3311:100186#/1 GAAGTGTCTGACTAAAGTCCGTTGCCCATTTTTTAATCAGGTTGTTCATTTTCTTACTGTTCAGTTTTAAGAGTTCTTTGTGTATTTTGTATGACAGTCC bbbeceeegggggiiihiiiihiiiiiiihiiiihhhhhhiefhhiihiiiiiiiihiiiiihhhghihhhffdddggggeedeeeedbdbddccccbcb 100 69.12 +XXXXXXXXXX:7:1101:2394:1961#/1 NCTGGAAGTGATGGTCCGGAACCGTTCCTGGCCCGCTGTGTCCCAGATCTGAAGTTTGATAGTTTTGCCATCCAGCTCGATGGTTCGGATCTTGAAGTCC BP\cceeeggeggifhiiiiihifhhihhffhiifgfffgfghihhhfhiihiigggefgeeceeeebbddbdcc`bcccccaY``aaacabcb[`bbcc 100 52.65 +XXXXXXXXXX:7:1101:3438:100192#/1 GGCGGATGAAGCAGATAGTGAGGAAAGTTGAGCCAATAATGACGTGAAGTCCGTGGAAGCCTGTGGCTACAAAAAATGTTGAGCCGTAGATGCCGTCGGA bbbeeeeegggggihiiifghhiihiighihiiiiihiiihihihiiiiiiiihiiifhhiefgggeeeedcdcc_acabbcccccacccbbbbcXa]a] 100 66.94 +XXXXXXXXXX:7:1101:2333:1962#/1 NGGTTGCTTGCGTGAGGAAATACTTGATGGCAGCTTCTGTGGAACGAGGGTTTATTTTTTTGGTTAGAACTGGAATAAAAGCTAGCATGTTTATTTCTAG BPYacccca]ee_c\egafbgfgghf]fhfdbg__a^efghaffcf`eghefhdghhdg^`[]a`bab]`bYb]b__bbbbabb__bcbbddbbbdbd`] 100 52.52 +XXXXXXXXXX:7:1101:3479:100209#/1 TAGAGGTGGGAACAAGAAAACATTGATATAGTTTTGAATTAACATTAAAGAGGCAAAATTTCACATTTAAAATGGCCCAAAATATCCCACTATTCATTTT abbeeeacgggggiiihiiiiiiiiiihiiiihihiiihiiiiiiiiiiiiiiighifgiiihiiiiiihiggggdgeeedcddeddccccccddddded 100 69.20 +XXXXXXXXXX:7:1101:2459:1990#/1 CGGGGAGGTAGCGATGAGAGTAATAGATAGGGCTCAGGCGTTTGTGTATGATATGTTTGCGGTTTCGATGATGTGGTCTTTGGAGTAGAAACCTGTGAGG a_beeeee`cggghiiiihhdfgfdhhiihiiihhiiihiffhifgefhifhhihfhggegeabcdaaddcdc`_`bcccccc[bbccccccccabbcb^ 100 66.80 +XXXXXXXXXX:7:1101:3417:100210#/1 CCTGGATATTGTTTTTTCTAATAATGCCTATCACAAAAATGTATAAATGCCTTCGTATCATACTTTTTTAAAAACAACTGTCAATAATGAAAACTGAATG aa_ceeeegggggiiiiiiiihiiigiiiiiibgghiiiiheffhiiihehiihighhhiihiiiiiiggggggeaabddbdbcddccccccccbc_bcc 100 68.25 +XXXXXXXXXX:7:1101:2372:1994#/1 GCGGTGATGGTAGCCTTTCTGCCCAGCGCGTGCCACAGAGAAGGCTACACGAGCAGGATGCCATGCCCCAATACAGGCCACCTTGCGCAGGCCTCGGTGG ___ecccceceeggggfhghiiifggfgfigghf_fdgdgiffffffhhhhaggeeecdbbZ`]bbcbcc_cccbccac^^^`bcccac[_X[_^acW^a 100 64.27 +XXXXXXXXXX:7:1101:3452:100214#/1 GAAAAGGATGGAGGCAAATTTTAGCAGCAACCTCCACCTGACTGCTTGACTGGAGTGCTCTGAATTTTAACATTGGACTTCTCAGCACCACCAGCTGTTG a__eeecagegffhhihiiiiifffhiiihhhfhihhihbggegbbffghihihibgg`gfhhhecffgggdgegedeeedcdcddccccccccccc]Y] 100 66.98 +XXXXXXXXXX:7:1101:2677:1830#/1 NTCATTTTGTTTAAAAACTCGCTTGTCCCAGATTTGGCTATGGTACCAAGGTTTTTAACCAACTCTTCTCTGGTCATTCCTACACCGGTGTCTGTGACAT BP\cceeeggggehhiiiiiiiiihfhhiihiiifffiiifhfeeghgiiicfhihhhhhihhffhhhhggedggceeeeeeccddcccccbbcbccccc 100 52.71 +XXXXXXXXXX:7:1101:3354:100219#/1 TCTGGCTCGTCTGAGGGCACGGATGTCCTTCCCAATGCCTCGTGTGAGTTGGTAAGTATTGCCAGCTAAGGAAAGAAAGTTGGATATGTTCTCACCCAAA aabeeeeefegeehhiiihiiiihfgfhggdgighhfdhdfdfg\e_eeghhhhhideggeggeeeeedcbZ`b^^`bb_`bcbbbbcZ_`cbdbcc[`_ 100 65.63 +XXXXXXXXXX:7:1101:2603:1846#/1 NTCCACTCCTAGGAGGTCCCCAGAGTCCTCAGATTCAGAGACAGAAAGGATGGGGGACGGGCACAGTGGCTCACGCCTGTACTCCCAGCACTTTGGGAGG BP\cceeeeggfghfhcegihihffeffdhihhiihhhhhghfhhfhhib`fgffh`geecccccbbc^_accb``_^``bb`]^`^`acc`bbY^]`aa 100 52.59 +XXXXXXXXXX:7:1101:3600:100019#/1 GGAGAGGTTAAAGGAGCCACTTATTAGTAATGTTGATAGTAGAATGATGGCTAGGGTGACTTCATATGAGATTGTTTGGGCTACTGCTCGCAGTGCGCCG aa_eeeeegggggiiihiiiiiiiihighihihhiiihifhhiiiiiiiiiiihiigiiiiiihhhhighfghggcggddgeeeedddcccccccccccc 100 69.05 +XXXXXXXXXX:7:1101:2535:1848#/1 NGTAGCGTACCAGCCCAGGATGAGCTCATTTGGAGAAACTTTTTTATGCAGTTCATACATATTCTTAGCAAATTCCATGTCAACAGCCACTTCATCTTCT BSYcceeegggggiiiiihghiifhhhiiiiiifhhihghihiiihihfhiiihiiihiiihhigggfgggeeeeeeecdddddcaccccccccdcbcdc 100 52.79
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r1_seqkit_stats1.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +file format type num_seqs sum_len min_len avg_len max_len Q1 Q2 Q3 sum_gap N50 Q20(%) Q30(%) +13-1941-6_S4_L001_R1_600000_fastq FASTQ DNA 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r1_seqkit_stats2.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +file format type num_seqs sum_len min_len avg_len max_len Q1 Q2 Q3 sum_gap N50 Q20(%) Q30(%) +13-1941-6_S4_L001_R1_600000_fastq FASTQ DNA 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r2_seqkit_fx2tab2.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,101 @@ +#id seq qual length avg.qual +XXXXXXXXXX:7:1101:1582:1835#/2 GCAATGATGGGGCCGCTCCCGGGGCCACACCTGCTTCTGGATCCGCTGCTTCCAAGTTCCTTTGCCTCCCTCCTGGCATCACTGTCTGCGACTCAGGCCG ___ccc`cgegfedfhfhhhfdfec_eg`_fhfhiihiid`ggdadc`bd`b_bcccb__bbbbcbc_`cX^abbccbbccccccccbbXXaaccb`baa 100 64.29 +XXXXXXXXXX:7:1101:1610:1859#/2 CAATAACACAGTCCAAAATATATGTATGTATGTATATATATATGCAGGCAACAAATAGCACAATGAATAAAATAGTACTTCATCTCAGTACTAACATTGA b_aeeeeeggfgchhiiiiiihhighiighihiihfhihiiiiiehhiihhhhhiiihiiiiiiiihiiihiiiidfhhiihigggggbceeeeeedddd 100 69.64 +XXXXXXXXXX:7:1101:1743:1871#/2 GCTTCCAAGGGACAAAGTCCTGCCCTTGGGTGTGGAAGACACCGTGGACAAGCTCAAGATGCTGGAAGGCCGCAAGACCAGCATCCGCAAGTCAGTGCAG bbbeeeeegggggiiiiihhigdgihiiihdcfhhhihfffhihfdhhhhihhhhhgfggggeeeeeeeca]a_accbcccccccba^_acbbccccccc 100 67.25 +XXXXXXXXXX:7:1101:1536:1878#/2 TGCCTATCATATAGTAAAACCCAGCCCATGACCCCTAACAGGGGCCCTCTCAGCCCTCCTAATGACCTCCGGCCTAGCCATGTGATTTCACTTCCACTCC ___ceeeegfegfhiiiiiii`ecghbcegfhihhiddhifhifgihiihe```efaffeeegfgececeabacccc[`bcccb`cdccccbcY]bccbb 100 65.99 +XXXXXXXXXX:7:1101:2990:100153#/2 TGGAGGCCTGCTGGGAACGGGACTTCTAAAAGGAACTATGTCTGGAAGGCTGTGGTCCAAGGCCATTTTTGCTGGCTATAAGCGGGGTCTCCGGAACCAA ___cccceggecgiihffghighiiiiifffgidfhhiiihiiihiihh^\eeghgffhihggggeeb_aabbdcccccdbbcacacOXbccccaaa^^P 100 61.60 +XXXXXXXXXX:7:1101:1624:1906#/2 GGCTGGTCTGTCCCCTCTGCATCTGGGGCTCCTCCTGGCCCTTCTCCCGCTGCCTGTCCTGCCTCCTGGCCCTGCAGCAGCACCTTGCCCAGTGATCTTT bbbeeeeegfgggiiiiiiihiiihiiihihiihiihihiiiiiiffhiiefhifgghegggggeececddcccc^bcccccccccbbcbccbbbcbbbc 100 67.90 +XXXXXXXXXX:7:1101:1666:1926#/2 GGCTGTGGGAACTCTAGCTGCTGTCAGCCCCTCCTGTAGGAGCTGGCCCTGCCCAGGCTCCTGACTTCCCTCAGGAAGTCTTTCTGTCTTTCTCCATCAG bbbeeeeeggeggiihiiiiiihiiiiiiiiiiiiiiiihhiiiihiiiihiihiihhiiihgbggfgeeeeadd]_a]bcccbccccccccc`bccbbc 100 67.77 +XXXXXXXXXX:7:1101:2921:100163#/2 GAAAAGGAGAACCCCATGCGGGAACTTCGCATCCGCAAACTCTGTCTCAACATCTGTGTTGGGGAGAGTGGAGACAGACTGACGCGAGCAGCCAAGGTGT bbbeeeeeggfggiihiiiiiihhiiihhhfcghfhiiihii]ggfdggfdgeeeebcddcbacccaa]b_ccbcccccccccca_ac_acccacccY__ 100 66.10 +XXXXXXXXXX:7:1101:1513:1929#/2 AAAATGAGGGCCCGTAACAGAACCAGTGTGTGTATAACGAAAACCATGTATAAAATGGGCCTATCACCCTTGTCAGAGATATAAATTACCACATTTGCCT ^__ZZc]cegYZ^decYe[ed^ZbaeYcbf^ecS^ehfghfhiifefhef_effcghghfggfeeeeedbdc`cbc`b`]b``c`bccbcbb[`bccccc 100 62.67 +XXXXXXXXXX:7:1101:2759:100170#/2 GGTCACCATGGATGGGCGAGTCAACGGGGGCCTCAACCTCTCCAGAGCCATTGGGGACCACTTCTATAAGAGAAACAAGAACCTGCCACCTGAGGAACAG bb_eeeeegggggiiiiihifhhiiiiiihiiffggbdeeeeddddccccccccccccccccccccddccccbccccccccccccccccccccbcb^`ac 100 66.80 +XXXXXXXXXX:7:1101:1708:1937#/2 GAATACTTTGTGTTTACCCACTGCCCCCTGACCACTGCTGAAGGCAGAAAGGGACGATCACCTACAGTACCTGGTTTGGGTCTTTATTCTCTCATTCTAG a_aeeeeeggbeghihgfhfhhiiffhiifhhhfhffhiidhfhggiiiihghhiihigggfeadeebbddcbcZ_`^aa^`bbbbbbbb`bc_c`c`_b 100 66.38 +XXXXXXXXXX:7:1101:2981:100211#/2 TTCCTCCTAACTCCTGCCAGAAACAGCTCTCCTCAACATGAGAGCTGCACCCCTCCTCCTGGCCAGGGCAGCAAGCCTTAGCCTTGGCTTCTTGTTTCTG __aeeeeegacgghghhhhfff`cffhfhdghhhhiihhhd[ag`ggghfefhiiiihhghacffd`deeeZ]bb`abcbccb`bcbb``^_bcSY[_`b 100 64.03 +XXXXXXXXXX:7:1101:1688:1946#/2 GAGAAAGGGAAGAAAGAGAAAGGAAAAGACGAAGGGAAGAGGAAGAAAGAGAAAAAGAAAGGGCTCGTGACAGAGAAAGAAGAAAGAGAAGTCGTTCACG aa_`ceeegccg`ffgfgffgdgfhiihhihhiiii[egZefcdfdfgfhegdfhieeggeceedccaccccbbb`bbc`acccccbbbbcbbc_a^bcc 100 66.02 +XXXXXXXXXX:7:1101:2767:100225#/2 TGCAGAATGGCTCCCGCAAAGAAGGGTGGCGAGAAGAAAAAGGGCCGTTCTGCCATCAACGAAGTGGTAACCCGAGAATACACCATCAACATTCACAAGC ___eeeee[eeggffhihhfffhhh]HY^eeYefffhihihgbgggeabdZ`bcccccb`_[_caccbccbccccccccc_bbbc``_]`bb]]`__bP[ 100 57.32 +XXXXXXXXXX:7:1101:1536:1959#/2 GAGACAAAAATTGTTTGAATCAGGACAAGGGAGGTTTGAGGGACTGTTTAACAGGTCCCCATGGTTCACGACCCTGATATCCACCATTATGGGCCCTCTG _W_PY^Y\cc]c[bdJ`YJb^J`eJJJJQWPH^cHY^gc\efUGG^WW\beebgfV\_gg_X^RMHVVVQ^RKXZ`GGGT]ZT]aa``Y]bbc^W_acX` 100 46.90 +XXXXXXXXXX:7:1101:2797:100234#/2 GGAAACGCTGGAGAAGACAGTGTTGCTAGTCTGTTCCTGTTCGTGAGAATGCTTTGAATGGAGGCTCACTGTGCTGCGGCGGCTGCGGCCGTAGCGGGCG aP\JY`JO`YY`QJQ`Q`R`[JQ[^X[IPPXYXYPbbYccee[HWOONNXN]Wd\[HNW___UbGU\\VRV\\]]_BBBBBBBBBBBBBBBBBBBBBBBB 100 38.76 +XXXXXXXXXX:7:1101:1552:1976#/2 TGTGAGCACACCATATATTTACAGTAGGAATAGACGTAGACACACGAGCATATTTCACCTCCGCTACCATAATCATCGCTATCCCCACCGGCGTCAAAGT bbbeeeeeggggghhfhffhgihfggihdbfffgihiiiiiiiiifghiiffgfhhdghhichiegeeeee_bbbddbcccccbccca_accaaaccbc] 100 67.40 +XXXXXXXXXX:7:1101:1748:1978#/2 CAAGGAGCTGTTCTGTCGTGGCTTTGGAATTCAGATGCTCTCACTGTGATAGAGATGGGGTCTTGGGGGGCTGGGAGCTGTTCTGTCGTGGCTTTGGAGT a__eeeeegggggiihhighihiiiiihhiihiiiiihiiiihiiifgeffgghhhihii_fhhiihgecccccc`aacbbccdccca^accccbbcbc` 100 67.54 +XXXXXXXXXX:7:1101:2779:100239#/2 GCTGTGGTTACCTGTCCCCTGCCCCTGGCCTCCAGCCAGCTGCCAGTGGCCCCTCAGCTGCCTGTGGTGAGGCAATACTTAGCTAGGTTCTTAGACGGCC ^[^aaccde`c`^dbbeefdgchcaZZeaf]fcgefff`edgd^e_W^]eZbebd`cddf_ddg`deacdddcV`]b`bcdbc]b_`GT]]b_]`BBBBB 100 45.65 +XXXXXXXXXX:7:1101:1593:1980#/2 GGCTGTTCTCGAACTCCTGACCTCAGGTGATCTGCCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACTGCGCCTAGCCGTCACATTTC bbbeeeeegggggiiiiiiiiiiiiiieghhiiiiihhiiiiiiiiiiiiiiihghiiiiighiiiiiiigdddeddddcdbcccccccccacccbccdd 100 68.79 +XXXXXXXXXX:7:1101:2946:100242#/2 AATCCCTTCACCCCAGTTGCCAAACAGACCCCCCACCCCCTGGATTTTCCTTCTCCCTCCATCCCTTGACGGTTCTGGCCTTCCCAAACTGCTTTTGATC b_beeeeegggeegagggdhiihhhihhibffhhfhgghihf_cZcbd]]^`ddee__caGMZ]^Zbb_]\FKT[bb]`cbcbbc`]a^bcc]`bbbO]b 100 52.75 +XXXXXXXXXX:7:1101:1987:1781#/2 GCCGCAACCTGCACAGCCATGCCCGGGCAAGAACTCAGGACGCTGAATGGCTCTCAGATGCTCCTGGTGTTGCTGGTGCTCTCGTGGCTGCCGCATGGGG bbbeeeeegggggiiiiiihiiiiiiiiiiiiiiiiiihhihiiiiigggggeeeeeeddddddcccbbacccccccccccccccccccccc[_aacaac 100 67.28 +XXXXXXXXXX:7:1101:3046:100006#/2 GACGAGATGGAGTTCACCGAGGCCGAGAGCAACATGAATGACCTGGTGTCCGAGTACCAGCAGTACCAGGATGCCACAGCCGAGGAGGAGGGCGAGTTCG bbbeeeeeggggehiiiiihhihiihghhhiiihhiiifhiiihiihigfdgeeedddddcccccccccccbccccccccccccccccaccacc[aX_ba 100 66.53 +XXXXXXXXXX:7:1101:1900:1788#/2 CGGCTATGCGCCACCCGAGACGGAGATCGTGCCGCTTGTGCTGCGCGGCCACCTCATGGACATCGAGTGCCTGGCCAGCGACGGCATGCTGCTGGTGAGC bbbeeeeefggggiiiiiiggiiheghiigghhhiiihhhiiiiigeccc__ccccbcccccccccccccccccccccccccccccccccccbcc[^b_b 100 66.67 +XXXXXXXXXX:7:1101:3214:100027#/2 CACAACAACTGCTACTTCAGTTGCGCAGACAGTATCAACACCCACAACACAAGATCAGACCCCAAGTTCTGCTGTTTCAGTTGCCACGCCTACAGTTAGT _bbeeeeefeggghhiiihhghhhhhi[fhhf^cghiifhhiagiiiiihfbffggiiggggecdeZ`bdddcccccbdccccbcbcccccccbbcccc] 100 66.59 +XXXXXXXXXX:7:1101:1848:1879#/2 GGAGAAATGACCTTGAAGTCAGCACTTGCTTTAGCTATCAAAGTACTAAATAAGACCATGGATGTTAGTAAACTCTCTGCTGAAAAAGTGGAAATTGCAA bbbeeeeegggfgiiihighiiihiiihiiiihhiiiiiiiiighhiiihegghiihhiiiiiiiiiiiiiiiiiiiiiiigfgfgee^beddcdbdbcc 100 69.46 +XXXXXXXXXX:7:1101:3237:100032#/2 CGCTTATGCAGACAGAGCACAGCTGACTGCACGAACCAAAGGAGACGCATGAGCCAGAGAGACAAGGAAGGCTTTCAAAGGAAGGGATGGTCAAGCTGGG bbbeeeeefggggihiiihiiiiihiiiiiiiiiihihiiiiiiiihihifhdfgfgggfeeeeddcdcccccccccccccccaccccccbbbbcbbccc 100 67.97 +XXXXXXXXXX:7:1101:3027:100049#/2 CTCCACCACGGTCCCCAAGATGATTGTGGACATCCAGTCTCACAGCAGAGTCATCTCCTATGCAGGCTGCCTGACTCAGATGTCTCTCTTTGCCATTTTT bbbeeeeegggggiiiiihhihhhihfhhhiiihhiicfgiiiiidffdhighihhiiifihiiifgggfeeeeecdbdddcdcdccccccccc_bcddc 100 68.43 +XXXXXXXXXX:7:1101:1756:1891#/2 CTCATATGAAGTCACCCTAGCCATCATTCTACTATCAACATTACTAATAAGTGGCTCCTTTAACCTCTCCACCCTTATCACAACACAAGAACACCTCTGA bbbeeeeeggggfiiiiiiiiiiiihiiiiiiiiihhihiiiiiighhiihhhiiiiiiiihhghhiiiiiiiiiifgggggeeeeccdddccccccbbc 100 69.48 +XXXXXXXXXX:7:1101:3238:100065#/2 GGGGAAGGAAAACAGGGTATGGGGGAAAGGACCCTGGGGAGCGAAGTGGAGGATACAACCTTGGGCCTGCAGGCCAGGCTACCTACCCACTTGGAAACCC bbbeeeeegggggiiiidebhihihfihiihiiiiiiihhiihigeceeebcbdcccccccccccccccccccccccaccbccbcbccccacccbbb`ac 100 67.08 +XXXXXXXXXX:7:1101:1915:1901#/2 TACTCATTCAACCAATAGCCCTGGCCGTACGCCTAACCGCTAACATTACTGCAGGCCACCTACTCATGCACCTAATTGGAAGCGCCACCCTAGCAATATC _bbeedeegeeggihhicdhhhidghheegihhhhiiiiihihifiihhigiihiggdeeeedcdbdbdcccbcccdc`bbbccccccccccbbcbcccd 100 67.56 +XXXXXXXXXX:7:1101:3198:100082#/2 GTCAGCTTACATCCCTGAGCAGGAAAGTTTACCCATGAAGATTGGTGGGATTTTTTGTTTGTTTGTTTTGTTTTGTTTGTTGTTTGTTGTTTGTTTTTTT babeeeeeeegggihihiiiiiiiiiifhihhhihhhgffgihhhX^ege]eghiihihffdggfgededdbddccccbccab`b^^bccccccbcbaca 100 66.54 +XXXXXXXXXX:7:1101:1964:1931#/2 CCCAAACCCACTCCACCTTACTACCAGACAACCTTAGCCAAACCATTTACCCAAATAAAGTATAGGCGATAGAAATTGAAACCTGGCGCAATAGATATAG a__ecece_agfefgfghhhhhehhfeeghfffffhfgffcffddfghihfgffghhihhefddffhgd]cdddcdc`bcccab^^^_acaccccc_bcc 100 66.53 +XXXXXXXXXX:7:1101:3088:100091#/2 AACATCTTAAGTCTTACCAGCCAGAATGTAGATACATAACTACAGTTAGTTGTGGAAGCTTTGGGATTTTAGTTGAGTGCTATCATCCCCAAATGTCATT __aeeeeegfgeghfihiiiiihiighigfggifhiiiiihihhhfhiihgghghhihbdgiihiacehhghhhhhfZbdeggeeedacbdadbbbcdcd 100 67.89 +XXXXXXXXXX:7:1101:1840:1948#/2 GGCGGGCAGTAGCCGCTGAGGGGATTGCAGATAACCGCTTCCCGCACGGGGAAAGTCTACCCTGCCTGCCACTTTCTGCTCGCCGTCAGCGCCGGAGCTC bbbeeeeegggggiiiiifghiighiiiihhfhigggeeecddccccccccccccccdcccccccccccccccccccccccccccccccccacccaca^b 100 66.86 +XXXXXXXXXX:7:1101:3105:100094#/2 GCTTTGTCAAGCCCGCTCTGCTGCATCAGTAGTGAATGGAGAGAATTATTTTGGCAGGGCTGGGATGGAGTTCAGGTGCCCTTGCTTGTTACGTGAAGTC ^V^ccce`egeegh[b[dbafbcagacce^SXe`_caee^afbf]ac[I^dfaeefZaBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBBB 100 36.74 +XXXXXXXXXX:7:1101:1958:1952#/2 CTTACTACTAATAATTATTACATTTTGACTACCACAACTCAACGGCTACATAGAAAAATCCACCCCTTACGAGTGCGGCTTCGACCCTATATCCCCCGCC bb_eeeeefgfgehhfhhihg]gfgfffgdghicegdhhhffgefhihiifhfgiiiif`fhffhh\dbdb^a^^b`_^aacN[_aaccbbd[]`_aX_a 100 62.07 +XXXXXXXXXX:7:1101:3190:100106#/2 AAAACACTGAACTGACAATTAACAGCCCAATATCTACAATCAACCAACAAGTCATTATTACCCTCACTGTCAACCCAACACAGGCATGCTCATAAGGAAA bbbeeeeegggggiiihiiiiiiiiiiiiihhiiihhiiifhiiihiiiieghhhihiiihfhhihiihhiiggggeeeeccdbcccccbc`bcbcbbbb 100 68.77 +XXXXXXXXXX:7:1101:1993:1999#/2 GCCCCCCGCACAGCCACCCGTGGGGTGCTGCCCTTATGCCCGGCGCCGGGCACCAACTCCATGTTTGGTGTTTGTCTGTGTTTGTTTTTCAAGAAATGAT bbbeeeeeggfggiiiiihhcffhh_e_dgfhgffgdcebecccccccccccccccccbcbccccdcc^^`acc`ccb_b]bbbP[^bc^_bbbcbcccb 100 63.20 +XXXXXXXXXX:7:1101:3117:100110#/2 AGGACTTCAAACTCTACTCCCACTAATAGCTTTTTGATGACTTCTAGCAAGCCTCGCTAACCTCGCCTTACCCCCCACTATTAACCTACTGGGAGAACTC bbbceeeefgfggiiiiihiihiihhiiiiiiihihefhiiihihihihifdhiihhiiiiiiiiiggeeedecccccccbcddccccccc\accccccc 100 68.17 +XXXXXXXXXX:7:1101:2159:1798#/2 CGGGCAGGGACCTGCAGGAGGCTTTCCCAGCAGGTGCACAGAAGGAAGCGCTGAGCCCACTGTGTGCAGAGGGTGTGTGCCCAGGGCACTGCCACGGCCC bb_eeeeegggggiiiiigiihiiiiiihiiiiiafghhehiiiihiiiifgigfggededdbdddcdccccc[_aacabbbcccccccbccccccccc] 100 67.04 +XXXXXXXXXX:7:1101:3147:100111#/2 CAAAATTTTGACAGGGAAGGAAGTAACTGCAAAACACTAGGCTTTAGTAGGTACTTATATAAAATCTAGTCCAGTTCTCTCATTTAAAAAAATGAAGACA bbbeeeeeggegghiighhihiibgfhiihhiiiiiiihihihiihhhhieeghiiihhiiihihihhhhiiiihfgcgggeeeeeeeddccccccbc`b 100 69.07 +XXXXXXXXXX:7:1101:2152:1838#/2 ATTCGGCGCATGAGCTGGAGTCCTAGGCACAGCTCTAAGCCTCCTTATTCGAGCCGAGCTGGGCCAGCCAGGCAACCTTCTAGGTAACGACCACATCTAC bbbeeeeegggggiiiiiiighiiiiiiiiiiiiiiiihiiiiiiiiiifhffhiggeccddccccccccccccaccccccccccbcccccacccccbbc 100 67.83 +XXXXXXXXXX:7:1101:3065:100152#/2 GGAGTGCGTGCCTGCTACGAACGCTCCAACGAGTACCAGCTGATTGACTGTGCCCAGTACTTCCTGGACAAGATCGACGTGATCAAGCAGGCTGACTATG __^cacccbeegghhiihhihihhhhchifdhfbgfhddffiibedffhhgffhiiiegfdggeeeca`bcddccaccaaaX^bbbbcc[^TW`W^``_b 100 63.71 +XXXXXXXXXX:7:1101:2180:1843#/2 ATCTGCTGCAGTGCTCTGAGCCCTAGGATTCATCTTTCTTTTCACCGTAGGTGGCCTGACTGGCATTGTATTAGCAAACTCATCACTAGACATCGTACTA bbbeeeeefgggghhhghihifiihgf_gfcdhhhiifhiihihiiighhhfffgdgfhiiihhhdffbfgffgeg^dcbeeeecdbbbdccccc`^`a_ 100 67.67 +XXXXXXXXXX:7:1101:3154:100159#/2 GTTTAGATAACCTCTAAGATCCAGCTTTAAAATTCTTGACTGAAGGCCTAACCTTTAGAAATATCTCGTTAGAGGCCAGACGCGGTGGCTCACGCCTATA babeeeeegggggiiiiihiiihiihiiiiiiiiiiiiiiiiiiiihiiihihiiiiiiiiiiiihihhiiihihggegeeeccc_cccccbccccaccb 100 69.02 +XXXXXXXXXX:7:1101:2125:1861#/2 CCCTCCACCACCTCTGTGGCTCCAGCTACCACATCTGGAGGCTTCTCATTCACTGGTGGAAGCACGGCCCAACCCTCCGGTTTCAACATTGGCTCAGCAG bbbeeeceggggfihihihhiiihhfihiihiihhhiihfhgfhhiififfhhfhhfghbghhcgggadcab^_^`ccaaW_]bbcbbbbbccbb]bcbc 100 66.16 +XXXXXXXXXX:7:1101:3198:100173#/2 CGCTTCCATGCCTTTATCCTGGGCCTCCTCAACACCAAGCAGTTGGAGCTGTGGTTTTCCAGTCTCCAGGAAGATGCAGGCCTGCTCTCCCTCCTGTACC _b_eccec`ggeehhihdfdgdf`dfhihfhhhhiiiihihhdgdhdfg_eecdebegfbdeadfdfhfgddaaadc_`accc\`c]bbcb^^abbYb`b 100 65.68 +XXXXXXXXXX:7:1101:2076:1911#/2 CCCAGGTATTGGGGACAGATAATGGGCCTGCCTTCATCTCCCAGGTAAGTCAGTCGGTGGCCAAGTTGCTGGGGATTGATTGGAAACTGCATCGTGCTTA abbeeeacggfggihihihiiiiihiiiiiiiiihhiiifiiiiiefhgeffgaehh`fhihgdgbgeeeeeccbacccd`bcbbbcbcbbbcaa_cccc 100 67.53 +XXXXXXXXXX:7:1101:3166:100190#/2 TGTGGTGGTTTCTCACAGCAGCCATGGGGAACGGAAGCGTCCCCAGGCCACAGCCTCCCCGCAGTGTGCGGACTCGGCCTGCTGAGCCTGCATGTTGGCG _a_ccacceeecghgfhhhcgfhigghhhiOb`g`ccbfcghhfbfcdgdcgbdegbcceccccW`Z]`^acccc^^a_accccccb^][[b_]SSGW__ 100 56.13 +XXXXXXXXXX:7:1101:2196:1920#/2 ACGGGGCTGTCTGCGTAAAACTTGCCACTTAGAGCCCTGCCTGCACCGTCGTCACGGCCCAGCCTGCAGGGTCGGGTGTGCTGACAGCCGGCTGTTAAGC abbeeeeegggggiihiifhiiiiiiiiiiihiiiiiiiiiifghiiiiifhhggfeeccacccccacccc`bacc^a_ccccccccccccccccccdbb 100 67.38 +XXXXXXXXXX:7:1101:3225:100207#/2 CTCCAACTCATGAGACCCACAACAAATAGCCCTTCTAAACGCTAATCCAAGCCTCACCCCACTACTAGGCCTCCTCCTAGCAGCAGCAGGCAAATCAGCC bbbeeeeegfgggiiihiiiiiiiihihfhhifghihihhiiiiiiiiiihghhiiihihhgggeeeeeedcdcdcbcccccccaacccbcaa^bcc__b 100 67.82 +XXXXXXXXXX:7:1101:2115:1927#/2 CGTGAATCTAAGAAGATCGATCGCCACATGTATCACAGCCTGTACCTGAAGGTGAAGGGGAATGTGTTCAAAAACAAGCGGATTCTCATGGAACACATCC bbaeeeadgggfghhiiiiiiihghiiiihehfgfhiffhifhhfiiigfegWbghfdghfhiigggfggeeeeecccccaacccccbccbcbc`bcccb 100 67.01 +XXXXXXXXXX:7:1101:3019:100219#/2 CCAACCTCCTACTCCTCATTGTACCCATTCTAATCGCAATGGCATTCCTAATGCTTACCGAACGAAAAATTCTAGGCTATATACAACTACGCAAAGGCCC a__accacagfaehihiffgh`efdcfff]gb`fgcfh_fffdfgg[abcdeghfhhfhcffffcedec_b_`dY_dcccdccccccbccaca[Xb`WW^ 100 63.93 +XXXXXXXXXX:7:1101:2179:1937#/2 CAAGAACAATAAATGTCTATCCTAATTTCAGACCCACTCCTAAAAACTCACTCATGGGAGCTCTGTGTGGATTTGGGCCCCTCATCTTCATTTATTATAT bbbeeeeegggggiiiiiiiihiiiiiiiihdhhhiiiiiiiiiiiihihgghiiiiiiiiiiiigiggidhggggfcedccccccccd_ceececdede 100 69.03 +XXXXXXXXXX:7:1101:3202:100230#/2 TGTACAAAGAGTAGCTGCCCCTTCTCAGGGCAGATGATGCTTTGAGAACATACTTTGGCCATTACCCCCAGCTTTGAGGAAAATGGGCTTTGGATGATTA _a_ceccea`aceggfhfihihiidhdh]e`eg^efgdhdhhihfhacgdefcgfhacbbegdffecga`ggeedb_c[`]_bbccaccccbccccbcbc 100 65.88 +XXXXXXXXXX:7:1101:2149:1945#/2 GCCTATCATATAGTAAAACCCAGCCCATGACCCCTAACAGGGGCCCTCTCAGCCCTCCTAATGACCTCCGGCCTAGCCATGTGATTTCACTTCCACTCCA bbbeeeeeggggfegghiiiihhiihififfhiiihihihiiihhihiihhhhiihhiigeffggeeecbbccccccccccdcccccbdcccccccb``b 100 68.03 +XXXXXXXXXX:7:1101:3211:100242#/2 TGAGGGCGTTGGGATGGCTTGTAGGATTTTTAAGAGAGGGTGTCTACAGACAAGCATTTTCTCTGTAGAGCAGCCACACGTTGTATAAACATAAACTTTA _a^ccccc_eeaeZ^bgg_cac[^^X^ccffg_a_fffGVaPZ_b]]e`c`cd``]db^]ZbZaZ]_b]]bbbBBBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.61 +XXXXXXXXXX:7:1101:2169:1964#/2 CTAGGACAAGGGCCAAGAACCGATGGTACCCACCTGGGCCCCGGCTCAGGGCCAAGAACAGATGATACCCAGATAAGGCGGAACCAGCAACAGTTTCTGA bbbeeeeegfggfiiiiiiiihhiihhhiiefhihhiiiihiigiggegedceccccbccccccbcdcbbccacccc]]acccaccaccccccbcdcccc 100 66.99 +XXXXXXXXXX:7:1101:3168:100244#/2 ACTGGATTAAGAAAATGTGGCACATACACACCATGGAATACTATGCAGCCATAAAAAATGATGAGTTCATGTCCTTTGTAGGGACATGGATGAAATTGGA _bbee`eeeegfgiihigfghiefghgifhihdhiihiidghhffhcgehfd_^eafgiiihifhcgghhggeggfgeacdecbbcbccbbbbccccccc 100 67.61 +XXXXXXXXXX:7:1101:3005:100246#/2 CAGGGAGGGAGACACCTAGATTAGCAGCTCAATTTGTACTACTTCAGCCAATCTGTGAATTTAAAAACTACACTGTTGCCTTGCTAGGATCCACCCTCCT aabeeeee`gggghihiiihiiiiiiiiihiihiiihiifhiiiihiiiighiiiiihihiiiiihiigggggeeeeeddcdddddbaccbcbc`_cccc 100 68.54 +XXXXXXXXXX:7:1101:2313:1789#/2 GCTCGCCGCTCGCTATGGCGTCGCTCACCGTGAAGGCCTACCTTCTGGGCAAGGAGGACGCGGCGCGCGAGATTCGCCGCTTCAGCTTCTGCTGCAGCCC bbbeeeeeggggfiiihhihfhiiihiiihifdhghggggeeeeeddcdcdccccc\[`ccccccV_aaXZ]_bbccaa___ab_bbcccbb_Y_bbb`a 100 64.11 +XXXXXXXXXX:7:1101:3253:100014#/2 CAAAACTAACCCCCTAATAAAATTAATTAACCACTCGTTCATCGACCTCCCCACCCCATCCAACATCTCCGCATGATGAAACTTCGGCTCACTCCTTGGC bbbeeeeegcgggiiiiiiiihiiiiiiiiiiiiihVafhiiidhh[eggghdghhigfgggeeeeedddccccc_bcdcccccccacaccccccc_`bc 100 66.29 +XXXXXXXXXX:7:1101:2361:1794#/2 CGTGGTTCACTGCAGCCTCAACCTCCTAGGCTCAAGCAATTCTCCTACTTTCCTGAGTAGCTGGGACTACAGGCATGCGCCACCATACCCACCTAATTTT __^c^`c`cgeegghhhi`gghagihddgfegfhiihihfhihiiifghihghihhifhfbcggcdecghagggggebccc`a`^b_bb`bcaaRYY]bB 100 52.68 +XXXXXXXXXX:7:1101:2337:1794#/2 CGACAACTCCTCCGGCCGGAACAGCATGGAAGGTCCAGCGTTCTCAAAATCCCTTAAAGATAAGATTAACCCGTGGGGCCCCCTAATAGTTATGGGGATC ab_eececggegehhhhhfghfffgbgffihefWbafbg`_cghhdbdgg]_bccdcdbb`_bb]b`_bcc^\WNZLXTT[acaabb]`GYY`]`W^GEW 100 51.43 +XXXXXXXXXX:7:1101:3284:100039#/2 TTCCTCAATCTGAACACCATGCGCCCGCGGCTGCGCTACAGCCCCTACTCCATCCCGGTGCCGGTCCCGGACGGCAGCAGTCTGCTCACCACCGCCCTGC bbbeeeeegggggiiiiiiihhghghhfiihiidgfhfgfegeeeecdddbccccccccaacccZaccccacccccccc_bccccccccccacccccccc 100 66.60 +XXXXXXXXXX:7:1101:2477:1795#/2 GGCCTGGATTCCACGGCCATGGCCTCTGCCGCTGCGGCGCAGGGACTGTCCGGGGCGTCCGCGGCCACCCTGCCCTTCCACCTCCAGCAGCACGTCCTGG ___ceee^ceegfifhfhcfhhiihhihhffgghiaffZd]a```cccccbaaacacaZ_acVZ]aac^ZWX`aabb[X]Y^aaW``]b[`a_TW`^WSX 100 60.46 +XXXXXXXXXX:7:1101:3310:100056#/2 CGCAAAACTAACCCCCTAATAAAATTAATTAACCACTCATTCATCGACCTCCCCACCCCATCCAACATCTCCGCATGATGAAACTTCGGCTCACTCCTTG bbbeeeeegggggiiiihiihiiihihfhhiiihiiiiihiiiiihhiiihhfhhiiiigggdeeeedddddccccccccdcccbcbcccccbbb]bcbc 100 68.01 +XXXXXXXXXX:7:1101:2355:1821#/2 GTCTTCGTCATGCTCAATGAAAATGTACTAAGTTCTCCCTCTGTGCTAGTAACAGTGATTCCCCACCATTCTCCTAAAAGAAAAAATTCTAGTCCAAATA aaaeeeecgggggiiiiiiiiihiighiihiighhiiiiiiiihiihiffeghihghiiiiiiiiiiiiiihiiiifggggggeecddcdccdccccccb 100 69.29 +XXXXXXXXXX:7:1101:3420:100060#/2 CCCAGAAAGGCTATTTTCAGATGAAATCGATATTAGAAGCTATATTAGCTGAAACAACTCCTTTTACTGCGTAGAACCTATATCGAGAGTGTGTGTATAT bbbeeeeecfgggehifhiiihhfhihhiffhhhhhdfgfihhihiiihgfhhihiiiihiihhiiihhi]dgeg`gceeeedccca^aZ]_bQ^[_acb 100 64.38 +XXXXXXXXXX:7:1101:2418:1834#/2 GGTGGCCCTCAATCCTGCCACCTTGCTCCCTCTACCGGAAAAAGGAGCCCCCCATGATTGCCTCGAGATCTTGGCTGAAACGCATGGAACCAGACCGGAT ab_ceeeeggggghiihihiiiiiifhiiihffgiiiifhiihfiiiiiighgaeeeedddddcccccaccccccccacccccaac^]_bcccacca[aX 100 66.17 +XXXXXXXXXX:7:1101:3267:100061#/2 GCCAGCTGCATGTTGTGAGGACACTCAAGCAGCTTTTTGGAGAGGTCCCATGGTGAGGTATTGAGATTTCCTGCCAATGTCCACATGAGTGAGCTCCCTT bbbeeeeeggggegigfihidfdiiiiiihfhhhhiihighhhhighiiifghfghghbeghihihegfbgggeeeeedddcdbbccccbbcccbccccc 100 68.35 +XXXXXXXXXX:7:1101:2378:1838#/2 GCTTGCTGCTGCTGGAGGTGTTTCCCATGATGAATTGCTTGACTTAGCAAAGTTTCATTTCGGTGACTCTTTATGCACACACAAAGGAGAAATACCAGCT bbbeeeeeggfggiighi`deghiiiiiiiiiiiiihihiihiiiffihiigfghihiifhhihihhhiiiihgggfggeeeccddcccccccccccccb 100 68.88 +XXXXXXXXXX:7:1101:3416:100083#/2 TGATCAACATCTTTTCTTGCCTCTGTCCCCTTCTCTCATCTCTTAGCTCCCCTCCAACCTGGGGGGCAGTGGTGTGGAGAAGCCACAGGCCTGAGATTTC b_beeeeegggggiiiiihiiihfhiiihiiiiiiiiiiiiiiiihhhiffghiiiiiiiihia`]accbccbaaa^bacccccbbaac_^ccccbbbcb 100 67.08 +XXXXXXXXXX:7:1101:2481:1853#/2 GCCTACTCATTCAACCAATAGCCCTGGCCGTACGCCTAACCGCTAACATTACTGCAGGCCACCTACTCATGCACCTAATTGGAAGCGCCACCCTAGCAAT bbbeeeeegggggiiiiiiiiiiiiiiiiihiiiiiihiiiihiiiiiiihiiiiggggeeeedddcdcccccccccccdcccccacccccccccccccc 100 68.19 +XXXXXXXXXX:7:1101:3411:100111#/2 CACATGCCTATCATATAGTAAAACCCAGCCCATGACCCCTAACAGGGGCCCTCTCAGCCCTCCTAATGACCTCCGGCCTAGCCATGTGATTTCACTTCCA bbbeeeeegggggihihiggiiiiihiiiiiiihhihihfhiihhfiihdaghiiiiiiihggggeeeeeeddcccccccccccccbbc_bc__bbbbcc 100 67.87 +XXXXXXXXXX:7:1101:3258:100128#/2 CCAGCCCCAGGTCCTCGGACACCGAGGAGAATGTCAAGAGGCGAACACACAACGTCTTGGAGCGCCAGAGGAGGAACGAGCTAAAACGGAGCTTTTTTGC _bbeceeegfggghfhhiihhhiidgf`gfhdh^effcebeghgdcedcc`^_aaa[^bbbbca]_Vaacaccc^W^_a_X_b`b``[^_aT[]`bcaX` 100 62.43 +XXXXXXXXXX:7:1101:2252:1856#/2 GAAGGGTTCACGGGAAGAGAAGCAGAAGCCCCAGGCTGAGCGGAAGGAGGAGAAAAAGGCGGCTGCCCCTGCTCCTGAGGAGGAGATGGATGAATGTGAG __Zc``cccagaefhihicggffffffdf]bcdP^aXaQaeghhghcddgPTZZ__GX\ZX_Zaa^`^[W[abb]]]GRWY[XGGGRY]RY_Y_Y_bc[b 100 50.14 +XXXXXXXXXX:7:1101:3428:100129#/2 CAGTTCTTCAAATATCTACTCATCTTCCTAATTACCATACTAATCTTAGTTACCGCTAACAACCTATTCCAACTGTTCATCGGCTGAGAGGGCGTAGGAA a_bceceeegegghhhhiiffffhfiiifihhihhhhffghiiibghidgccgeghhhhidghffhiifihhhfhgegcfggeeeccccca_aa_\]^b` 100 67.40 +XXXXXXXXXX:7:1101:2394:1871#/2 GCTAAATAAGCTATCGGGCCCATACCCCGAAAATGTTAGTTATACCCTTCCCGTACTAATTAATCCCCTGGCCCAACCCGTCATCTACTCTACCATCTTT bbbeeeeegggggiiiiiiiiiiiiiiiiiiiiiifhiighiiiiiiiiighiggggggeeeeeeddcdccccccccccccccccbbcdcccccccccbc 100 68.16 +XXXXXXXXXX:7:1101:3387:100138#/2 GCCAGGCCTGCCAGGGAGGCCAGGGCTGACTGCTCTTCCCCTCCCATGGCTGGTGCCCAGCCCCCCCCCCCCCCCCCCCACAAACAAGGGGCCCGGCCCC bbbeeeeegggggihifhihihiiihiiihefhfhhhhiiiiiihfdW\ebdgZc`ggbdgeeecccccccBBBBBBBBBBBBBBBBBBBBBBBBBBBBB 100 38.37 +XXXXXXXXXX:7:1101:2269:1904#/2 AAAGGAGGCAGATGGGTCCTAGAGGCAGCCCATGGCAAGGGAGAGGTCTGCTTTTTTCTTTTTTTTTGAGACGGAGTTTCACTTTTGTTGCCCAGGCTGG _[_c`Za]ecceghfeeae`Xecee^bghffccgfdf]egfggOacM\Zeefbd]_[bg]bcc[]aaZ^ccY[OETJR]Y]_YS]`YJRWSSGJQ[[`aB 100 48.61 +XXXXXXXXXX:7:1101:3444:100163#/2 CGTGTGTGCGCCTAATCTCAGGTGGTCCACCCGAGACCCCTTGAGCACCAACCCTAGTCCCCCGCGCGGCCCCTTATTCGCTCCGACAAGATGAAAGAAA aaYY\YQ\\_Y[[behifh`afQXebdefd^^U__U_cac^\aeg_edgf\Z_\^`]\bRZZ\[_^WWZTTXX`ab]bY^T_`Xa[ET[Q^_`bb]]b`[ 100 53.54 +XXXXXXXXXX:7:1101:2259:1943#/2 AAAAATTAGCTGGGCATGCTGGCGCACACCTGTGGCTCTAGCTACTCGAGGAGATGAGGTAGAAGGATCACTTGAGCCCAGGAGTTGGAGCCACAGTGAG ^__aaca`beacg`^`bb_dg]bcgdgHPY^e^cgcaefffhdc`c[Ze``TbUV\HV`M\a^aZaUZ`]]bbcR]]^^^`_[WKY]]b^BBBBBBBBBB 100 42.61 +XXXXXXXXXX:7:1101:3371:100179#/2 CCGGAATGCCCCGACGTTACTCGGACTACCCCGATGCATACACCACATGAAACATCCTATCATCTGTAGGCTCATTCATTTCTCTAACAGCAGTAATATT bbbeeeeegggggiiihiiiiiiihiiiiifhiehhiiiiiiiigggfeeeeeeddddddccdcccccbccccccdddddeddccdbccccccbcc`bcb 100 67.68 +XXXXXXXXXX:7:1101:2371:1957#/2 CGCTAAATCCCCTAGAAGTCCCACTCCTAAACACATCCGTATTACTCGCATCAGGAGTATCAATCACCTGAGCTCACCATAGTCTAATAGAAAACAACCG _b_eeeeecefgghfhiihhfhiiidfhhhdfhhii_ghhhiihieihhhdfghihheghiihhfgggfb]aceab`a]]bb`ccccdcb`bbccccccc 100 66.91 +XXXXXXXXXX:7:1101:3311:100186#/2 AAGTAATTGATAAGCTGGACTGTGCTAAAATTAGAAATATCTGCTCTGTGAAAGACAATGTCAAGAAAATGTAAAGACAAGCTACAGAATGGGAGAGAAT _b_cceeegggggiiiiifhiighihiiiiiihiiiiiiiiiiihiiigifghiihiiiiiiiiiiihihigghhihiiiigfgggebeeeeddcbcacc 100 69.35 +XXXXXXXXXX:7:1101:2394:1961#/2 CCCGAATATGACTACCTGTTTAAGCTGCTTTTGATTGGCGACTCAGGCGTGGGCAAGTCATGCCTGCTCCTGCGGTTTGCTGATGACACGTACACAGAGA b__eeeecgggggiiiiihhifhghhhhhiiiifiiffhihiihfhaffff]`gbgggggfgecbeeddddbbac^\_abb_bbbbbbcc`^accccb^[ 100 66.13 +XXXXXXXXXX:7:1101:3438:100192#/2 CCTGAGCTCACCATAGTCTAATAGAAAACAACCGAAACCAAATAATTCAAGCACTGCTTATTACAATTTTACTGGGTCTCTATTTTACCCTCCTACAAGC bbbeeeeegfggfiiifgiiiiiiiiiihiiiihgfhiiiihiiiiiiiihhfhhiiiiiiiihifheggggfeeeccbdddcddccccccccbcbcbcc 100 68.74 +XXXXXXXXXX:7:1101:2333:1962#/2 CAACCCGTCATCTACTCTACCATCTTTGCAGGCACACTCATCACAGCGCTAAGCTCGCACTGATTTTTTACCTGAGTAGGCCTAGAAATAAACATGCTAG ^a_ccc^O[beeedfh`e_gdffgdc]cedcehdR^e^RcfhhdcX^e`gafbfffa_FTS^RMMM]_aZ]Z]``XY]RTGTGY[bbb`bcb`__b`Y`_ 100 51.00 +XXXXXXXXXX:7:1101:3479:100209#/2 CCAGAAACTGCTAAAGAACATGGCCTGTTTGACATGTTCATGAGTCACCTGACCCACAGCATATATGCTTATGACTAAACCCTCCACTCCTGATTCTCAA bbbeeeeegggggiiiiihihiihiifeghfgiihhchghiiiheghiiihiiiiiiiiiiihiiiiiihiihiicgggggeeecddddcccbcccccdc 100 69.18 +XXXXXXXXXX:7:1101:2459:1990#/2 CCACAACCTTAACAATGAACAAGATATTCGAAAAATAGGAGGACTACTCAAAACCATACCTCTCACTTCAACCTCCCTCACCATTGGCAGCCTAGCATTA bbbeeeeegggggiihhiihiiiihfghhiiiigegfhfghiiiiiiiihihhhhiihihhhiiiiiggfdggeeeedddcccccccccccccccccccc 100 68.75 +XXXXXXXXXX:7:1101:3417:100210#/2 GCAGACTACTACTATGGATAACTACAGTGCGATTCGTTCATGACTGAGCGTGGAGCAGAGTCCACACAGAAGTTGATCGTGGTACCCAAGGCTGCTTCTC bbbeeeeegggggiiiiiiiiiiiiiighiiiihiihiiiiiiiihifiiighhiiihiifgiiiggggeee_cedcdcdcc``ccccccccbccccccc 100 68.39 +XXXXXXXXXX:7:1101:2372:1994#/2 GTTTGGGCAGGATGAGATGATCGACGTCATCGGGGTGACCAAGGGCAAAGGCTACAAAGGGGTCACCAGTCGTTGGCACACCAAGAAGCTGCCCCGCAAG _^^c`ccabee`ca]f[dd[]J`dPbbedX_gghiOVUbf]_bfg_d\db^Z^_`_`b_b__NFXT_]`TYWWXX`YY]X^^^`W^`bccbbcccX]cBB 100 48.35 +XXXXXXXXXX:7:1101:3452:100214#/2 CGTTTTTGGAAACCAGTGCTAAGAATGCAACGAATGTAGAACAGTCTTTCATGACGATGGCAGCTGAGATTAAAAAGCGAATGGGTCCCGGAGCAACAGC bbbcecccgeggghiidcggfhhdfhhbffehhhhi]ccfghiicfffffbcfbegba_efgfhhgc^dggccee[R`[_^NGYQYR[a^a]_[`X^`^a 100 55.72 +XXXXXXXXXX:7:1101:2677:1830#/2 TGAAAATGCTCTTTCTGGAAATGAGGAACTAACAGTCAAAATTAAGTGTGATAAGGAGAAGAACCTGCTGCATGTCACAGACACCGGTGTAGGAATGACC bbbeeeeegggggiiiiheghhhihhiihhhhfhighiiiiihifhefhghhiiiiiiiiihiihihhhiiiiiiigfggfeeeecc^a_ccccbccccc 100 68.81 +XXXXXXXXXX:7:1101:3354:100219#/2 ACAGCCGCTTTGACCGGGATTACCAGCAGTACCATGGACTACGGAAAGAAGTGGTGGACACAAGCCCAAGCCCACGACCTGGTCATCAAAAGCCTTGACA bbbeeeeegggggiiiiihiiiiiiiihighhiiiihfiihiihfghibgggggdgeceeedcdbaaaaaccc`a__accccbbccccccccccccbcbb 100 67.23 +XXXXXXXXXX:7:1101:2603:1846#/2 GCTAATTTTTGTATTTTTCATAGAGACAGGGTTTCACCATGTTGGCCAGGCTGGTCTCGAACTCCTGATCTTAGGTGAGCCGCCCGCCTCAGCCTCCCAA bbbeeeeeggfegiihhhhifihiifiiiffbfhihdcghfehheghhhhhfhh`efhhaegihihfcfhiigffdgdceecccc\^cccccbbbcccbc 100 67.68 +XXXXXXXXXX:7:1101:3600:100019#/2 CCCCTGGTCAACCTCAACCTAGGCCTCCTATTTATTCTAGCCACCTCTAGCCTAGCCGTTTACTCAATCCTCTGATCAGGGTGAGCATCAAACTCAAACT bbbeeeeeggfggiiiihiiiihhiiiiihiiiiiiiihihihhghihiigghhhhhhfgfhihiiiiiggggggeeeecc]^`dbbccccccccccccc 100 68.39 +XXXXXXXXXX:7:1101:2535:1848#/2 CCCGAGTTATCGGGACCCTGTTGGGAACTGTCGACAAACACTCAGTGGAGGTCACCAATTGCTTTTCAGTGCCGCACAATGAGTCAGAAGATGAAGTGGC _bbeeeceggggfhihiihihiihiihiiihhhiiiiiiiihiiifhhhigggggggeeedeedddccddcccccZZ\X`bbcbccbccccccc_Y_bcc 100 65.68
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/r2_seqkit_stats2.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +file format type num_seqs sum_len min_len avg_len max_len Q1 Q2 Q3 sum_gap N50 Q20(%) Q30(%) +13-1941-6_S4_L001_R2_600000_fastq FASTQ DNA 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00
--- a/test-data/samtools_idxstats.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 45 4047 -* 0 0 5
--- a/test-data/samtools_idxstats1.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 17063 0 -* 0 0 223
--- a/test-data/samtools_idxstats2.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 45 4047 -* 0 0 5
--- a/test-data/samtools_idxstats3.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 24 0 -* 0 0 2
--- a/test-data/samtools_idxstats4.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 17063 0 -* 0 0 223
--- a/test-data/samtools_idxstats5.tabular Mon Dec 06 18:28:04 2021 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,2 +0,0 @@ -NC_002945.4 4349904 46 2 -* 0 0 4
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/statistics_output1.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +FASTQ File Size Read Count Length Sum Min Length Ave Length Max Length Q1 Q2 Q3 Sum Gap N50 Passing Q20 Passing Q30 Read Quality Ave +13-1941-6_S4_L001_R1_600000_fastq_gz 8.7 KB 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00 101.01
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/statistics_output2.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +R1 FASTQ R1 File Size R1 Read Count R1 Length Sum R1 Min Length R1 Ave Length R1 Max Length R1 Q1 R1 Q2 R1 Q3 R1 Sum Gap R1 N50 R1 Passing Q20 R1 Passing Q30 R1 Read Quality Ave R2 FASTQ R2 File Size R2 Read Count R2 Length Sum R2 Min Length R2 Ave Length R2 Max Length R2 Q1 R2 Q2 R2 Q3 R2 Sum Gap R2 N50 R2 Passing Q20 R2 Passing Q30 R2 Read Quality Ave +13-1941-6_S4_L001_R1_600000_fastq_gz 8.7 KB 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00 101.01 13-1941-6_S4_L001_R2_600000_fastq_gz 8.5 KB 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00 101.01
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/statistics_output3.tabular Fri Jun 10 06:11:08 2022 +0000 @@ -0,0 +1,2 @@ +R1 FASTQ R1 File Size R1 Read Count R1 Length Sum R1 Min Length R1 Ave Length R1 Max Length R1 Q1 R1 Q2 R1 Q3 R1 Sum Gap R1 N50 R1 Passing Q20 R1 Passing Q30 R1 Read Quality Ave R2 FASTQ R2 File Size R2 Read Count R2 Length Sum R2 Min Length R2 Ave Length R2 Max Length R2 Q1 R2 Q2 R2 Q3 R2 Sum Gap R2 N50 R2 Passing Q20 R2 Passing Q30 R2 Read Quality Ave +Unnamed Collection_R1 8.7 KB 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00 101.01 Unnamed Collection_R2 8.5 KB 100 10000 100 100.0 100 50.0 100.0 50.0 0 100 100.00 100.00 101.01
--- a/vsnp_add_zero_coverage.py Mon Dec 06 18:28:04 2021 +0000 +++ b/vsnp_add_zero_coverage.py Fri Jun 10 06:11:08 2022 +0000 @@ -33,15 +33,17 @@ def get_zero_df(reference): # Create a zero coverage dictionary. zero_dict = {} + reference_length = 0 for record in SeqIO.parse(reference, "fasta"): chrom = record.id total_len = len(record.seq) + reference_length = reference_length + len(record.seq) for pos in list(range(1, total_len + 1)): zero_dict["%s-%s" % (str(chrom), str(pos))] = 0 # Convert it to a data frame with depth_x # and depth_y columns - index is NaN. zero_df = pandas.DataFrame.from_dict(zero_dict, orient='index', columns=["depth"]) - return zero_df + return zero_df, reference_length def output_zc_vcf_file(base_file_name, vcf_file, zero_df, total_zero_coverage, output_vcf): @@ -82,25 +84,28 @@ return good_snp_count -def output_metrics_file(base_file_name, average_coverage, genome_coverage, good_snp_count, output_metrics): - bam_metrics = [base_file_name, "", "%4f" % average_coverage, genome_coverage] - vcf_metrics = [base_file_name, str(good_snp_count), "", ""] - metrics_columns = ["File", "Number of Good SNPs", "Average Coverage", "Genome Coverage"] +def output_metrics_file(base_file_name, average_coverage, genome_coverage, good_snp_count, dbkey, reference, + reference_length, total_zero_coverage, percent_ref_with_zero_coverage, output_metrics): + columns = ["BAM File", "Reference", "reference Length", "Genome with Coverage", "Average Depth", + "No Coverage Bases", "Percent Ref with Zero Coverage", "Quality SNPs"] + values = [base_file_name, dbkey, str(reference_length), genome_coverage, average_coverage, + str(total_zero_coverage), percent_ref_with_zero_coverage, str(good_snp_count)] with open(output_metrics, "w") as fh: - fh.write("# %s\n" % "\t".join(metrics_columns)) - fh.write("%s\n" % "\t".join(bam_metrics)) - fh.write("%s\n" % "\t".join(vcf_metrics)) + fh.write("# %s\n" % "\t".join(columns)) + fh.write("%s\n" % "\t".join(values)) -def output_files(vcf_file, total_zero_coverage, zero_df, output_vcf, average_coverage, genome_coverage, output_metrics): +def output_files(vcf_file, total_zero_coverage, percent_ref_with_zero_coverage, zero_df, output_vcf, + average_coverage, genome_coverage, output_metrics, reference, reference_length, dbkey): base_file_name = get_sample_name(vcf_file) good_snp_count = output_zc_vcf_file(base_file_name, vcf_file, zero_df, total_zero_coverage, output_vcf) - output_metrics_file(base_file_name, average_coverage, genome_coverage, good_snp_count, output_metrics) + output_metrics_file(base_file_name, average_coverage, genome_coverage, good_snp_count, dbkey, reference, + reference_length, total_zero_coverage, percent_ref_with_zero_coverage, output_metrics) -def get_coverage_and_snp_count(bam_file, vcf_file, reference, output_metrics, output_vcf): +def get_coverage_and_snp_count(bam_file, vcf_file, dbkey, reference, output_metrics, output_vcf): coverage_df = get_coverage_df(bam_file) - zero_df = get_zero_df(reference) + zero_df, reference_length = get_zero_df(reference) coverage_df = zero_df.merge(coverage_df, left_index=True, right_index=True, how='outer') # depth_x "0" column no longer needed. coverage_df = coverage_df.drop(columns=['depth_x']) @@ -109,19 +114,22 @@ coverage_df = coverage_df.fillna(0) coverage_df['depth'] = coverage_df['depth'].apply(int) total_length = len(coverage_df) - average_coverage = coverage_df['depth'].mean() + average_coverage = "{:.2f}".format(coverage_df['depth'].mean()) zero_df = coverage_df[coverage_df['depth'] == 0] total_zero_coverage = len(zero_df) + percent_ref_with_zero_coverage = "{:.6%}".format(total_zero_coverage / reference_length * 100) total_coverage = total_length - total_zero_coverage genome_coverage = "{:.2%}".format(total_coverage / total_length) # Output a zero-coverage vcf fil and the metrics file. - output_files(vcf_file, total_zero_coverage, zero_df, output_vcf, average_coverage, genome_coverage, output_metrics) + output_files(vcf_file, total_zero_coverage, percent_ref_with_zero_coverage, zero_df, output_vcf, + average_coverage, genome_coverage, output_metrics, reference, reference_length, dbkey) if __name__ == '__main__': parser = argparse.ArgumentParser() parser.add_argument('--bam_input', action='store', dest='bam_input', help='bam input file') + parser.add_argument('--dbkey', action='store', dest='dbkey', help='bam input dbkey') parser.add_argument('--output_metrics', action='store', dest='output_metrics', required=False, default=None, help='Output metrics text file') parser.add_argument('--output_vcf', action='store', dest='output_vcf', required=False, default=None, help='Output VCF file') parser.add_argument('--reference', action='store', dest='reference', help='Reference dataset') @@ -129,4 +137,4 @@ args = parser.parse_args() - get_coverage_and_snp_count(args.bam_input, args.vcf_input, args.reference, args.output_metrics, args.output_vcf) + get_coverage_and_snp_count(args.bam_input, args.vcf_input, args.dbkey, args.reference, args.output_metrics, args.output_vcf)
--- a/vsnp_build_tables.py Mon Dec 06 18:28:04 2021 +0000 +++ b/vsnp_build_tables.py Fri Jun 10 06:11:08 2022 +0000 @@ -1,6 +1,7 @@ #!/usr/bin/env python import argparse +import itertools import multiprocessing import os import queue @@ -153,11 +154,6 @@ return base_file_name -def output_cascade_table(cascade_order, mqdf, group, annotation_dict): - cascade_order_mq = pandas.concat([cascade_order, mqdf], join='inner') - output_table(cascade_order_mq, "cascade", group, annotation_dict) - - def output_excel(df, type_str, group, annotation_dict, count=None): # Output the temporary json file that # is used by the excel_formatter. @@ -183,19 +179,6 @@ excel_formatter(json_file_name, excel_file_name, group, annotation_dict) -def output_sort_table(cascade_order, mqdf, group, annotation_dict): - sort_df = cascade_order.T - sort_df['abs_value'] = sort_df.index - sort_df[['chrom', 'pos']] = sort_df['abs_value'].str.split(':', expand=True) - sort_df = sort_df.drop(['abs_value', 'chrom'], axis=1) - sort_df.pos = sort_df.pos.astype(int) - sort_df = sort_df.sort_values(by=['pos']) - sort_df = sort_df.drop(['pos'], axis=1) - sort_df = sort_df.T - sort_order_mq = pandas.concat([sort_df, mqdf], join='inner') - output_table(sort_order_mq, "sort", group, annotation_dict) - - def output_table(df, type_str, group, annotation_dict): if isinstance(group, str) and group.startswith("dataset"): # Inputs are single files, not collections, @@ -233,10 +216,6 @@ except queue.Empty: break newick_file, json_file, json_avg_mq_file = tup - avg_mq_series = pandas.read_json(json_avg_mq_file, typ='series', orient='split') - # Map quality to dataframe. - mqdf = avg_mq_series.to_frame(name='MQ') - mqdf = mqdf.T # Get the group. group = get_sample_name(newick_file) snps_df = pandas.read_json(json_file, orient='split') @@ -245,67 +224,53 @@ line = re.sub('[:,]', '\n', line) line = re.sub('[)(]', '', line) line = re.sub(r'[0-9].*\.[0-9].*\n', '', line) + line = re.sub("'", '', line) line = re.sub('root\n', '', line) sample_order = line.split('\n') - sample_order = list([_f for _f in sample_order if _f]) + sample_order = list(filter(None, sample_order)) sample_order.insert(0, 'root') - tree_order = snps_df.loc[sample_order] + tree_order_df = snps_df.loc[sample_order] + # Output the sorted table. + output_table(tree_order_df, "sort", group, annotation_dict) # Count number of SNPs in each column. snp_per_column = [] - for column_header in tree_order: + for column_header in tree_order_df: count = 0 - column = tree_order[column_header] + column = tree_order_df[column_header] for element in column: - if element != column[0]: + # column[0] is top row/root/reference, + # element is everything below it. + if element != column[0] and element != '-': count = count + 1 snp_per_column.append(count) - row1 = pandas.Series(snp_per_column, tree_order.columns, name="snp_per_column") + row1 = pandas.Series(snp_per_column, tree_order_df.columns, name="snp_per_column") # Count number of SNPS from the # top of each column in the table. snp_from_top = [] - for column_header in tree_order: + for column_header in tree_order_df: count = 0 - column = tree_order[column_header] - # for each element in the column - # skip the first element - for element in column[1:]: - if element == column[0]: - count = count + 1 - else: - break - snp_from_top.append(count) - row2 = pandas.Series(snp_from_top, tree_order.columns, name="snp_from_top") - tree_order = tree_order.append([row1]) - tree_order = tree_order.append([row2]) - # In pandas=0.18.1 even this does not work: - # abc = row1.to_frame() - # abc = abc.T --> tree_order.shape (5, 18), abc.shape (1, 18) - # tree_order.append(abc) - # Continue to get error: "*** ValueError: all the input arrays must have same number of dimensions" - tree_order = tree_order.T - tree_order = tree_order.sort_values(['snp_from_top', 'snp_per_column'], ascending=[True, False]) - tree_order = tree_order.T + column = tree_order_df[column_header] + index_list_of_ref_differences = [] + for ind, list_item in enumerate(column[1:].to_list()): + if list_item not in [column[0], '-']: + index_list_of_ref_differences.append(ind) + c = itertools.count() + val = max((list(g) for _, g in itertools.groupby(index_list_of_ref_differences, lambda x: x - next(c))), key=len) + # Starting row number with longest continous SNPs in column + snp_from_top.append(val[0]) + row2 = pandas.Series(snp_from_top, tree_order_df.columns, name="snp_from_top") + tree_order_df = tree_order_df.append([row1]) + tree_order_df = tree_order_df.append([row2]) + tree_order_df = tree_order_df.T + tree_order_df = tree_order_df.sort_values(['snp_from_top', 'snp_per_column'], ascending=[True, False]) + tree_order_df = tree_order_df.T # Remove snp_per_column and snp_from_top rows. - cascade_order = tree_order[:-2] + cascade_order_df = tree_order_df[:-2] # Output the cascade table. - output_cascade_table(cascade_order, mqdf, group, annotation_dict) - # Output the sorted table. - output_sort_table(cascade_order, mqdf, group, annotation_dict) + output_table(cascade_order_df, "cascade", group, annotation_dict) task_queue.task_done() -def set_num_cpus(num_files, processes): - num_cpus = len(os.sched_getaffinity(0)) - if num_files < num_cpus and num_files < processes: - return num_files - if num_cpus < processes: - half_cpus = int(num_cpus / 2) - if num_files < half_cpus: - return num_files - return half_cpus - return processes - - if __name__ == '__main__': parser = argparse.ArgumentParser() @@ -357,7 +322,6 @@ queue1 = multiprocessing.JoinableQueue() queue2 = multiprocessing.JoinableQueue() num_files = len(newick_files) - cpus = set_num_cpus(num_files, args.processes) # Set a timeout for get()s in the queue. timeout = 0.05 @@ -367,7 +331,7 @@ queue1.put((newick_file, json_file, json_avg_mq_file)) # Complete the preprocess_tables task. - processes = [multiprocessing.Process(target=preprocess_tables, args=(queue1, annotation_dict, timeout, )) for _ in range(cpus)] + processes = [multiprocessing.Process(target=preprocess_tables, args=(queue1, annotation_dict, timeout, )) for _ in range(args.processes)] for p in processes: p.start() for p in processes:
--- a/vsnp_build_tables.xml Mon Dec 06 18:28:04 2021 +0000 +++ b/vsnp_build_tables.xml Fri Jun 10 06:11:08 2022 +0000 @@ -110,12 +110,12 @@ <output_collection name="excel" type="list" count="2"> <element name="cascade_table" ftype="xlsx"> <assert_contents> - <has_size value="6853" delta="100"/> + <has_size value="6766" delta="100"/> </assert_contents> </element> <element name="sort_table" ftype="xlsx"> <assert_contents> - <has_size value="6847" delta="100"/> + <has_size value="6760" delta="100"/> </assert_contents> </element> </output_collection> @@ -138,41 +138,41 @@ </param> <param name="input_avg_mq_json_collection"> <collection type="list"> - <element name="Mbovis-01_snps.json" value="Mbovis-01_avg_mq.json" dbkey="89"/> - <element name="Mbovis-01D_snps.json" value="Mbovis-01D_avg_mq.json" dbkey="89"/> - <element name="Mbovis-01D6_snps.json" value="Mbovis-01D6_avg_mq.json" dbkey="89"/> + <element name="Mbovis-01_avg_mq.json" value="Mbovis-01_avg_mq.json" dbkey="89"/> + <element name="Mbovis-01D_avg_mq.json" value="Mbovis-01D_avg_mq.json" dbkey="89"/> + <element name="Mbovis-01D6_avg_mq.json" value="Mbovis-01D6_avg_mq.json" dbkey="89"/> </collection> </param> <param name="gbk_param" value="no"/> <output_collection name="excel" type="list" count="6"> <element name="Mbovis-01D6_snps_cascade_table" ftype="xlsx"> <assert_contents> - <has_size value="6854" delta="100"/> + <has_size value="6767" delta="100"/> </assert_contents> </element> <element name="Mbovis-01D6_snps_sort_table" ftype="xlsx"> <assert_contents> - <has_size value="6847" delta="100"/> + <has_size value="6761" delta="100"/> </assert_contents> </element> <element name="Mbovis-01D_snps_cascade_table" ftype="xlsx"> <assert_contents> - <has_size value="6854" delta="100"/> + <has_size value="6767" delta="100"/> </assert_contents> </element> <element name="Mbovis-01D_snps_sort_table" ftype="xlsx"> <assert_contents> - <has_size value="6847" delta="100"/> + <has_size value="6761" delta="100"/> </assert_contents> </element> <element name="Mbovis-01_snps_cascade_table" ftype="xlsx"> <assert_contents> - <has_size value="6853" delta="100"/> + <has_size value="6767" delta="100"/> </assert_contents> </element> <element name="Mbovis-01_snps_sort_table" ftype="xlsx"> <assert_contents> - <has_size value="6847" delta="100"/> + <has_size value="6761" delta="100"/> </assert_contents> </element> </output_collection>
--- a/vsnp_get_snps.py Mon Dec 06 18:28:04 2021 +0000 +++ b/vsnp_get_snps.py Fri Jun 10 06:11:08 2022 +0000 @@ -21,18 +21,6 @@ return datetime.fromtimestamp(time.time()).strftime('%Y-%m-%d %H-%M-%S') -def set_num_cpus(num_files, processes): - num_cpus = len(os.sched_getaffinity(0)) - if num_files < num_cpus and num_files < processes: - return num_files - if num_cpus < processes: - half_cpus = int(num_cpus / 2) - if num_files < half_cpus: - return num_files - return half_cpus - return processes - - def setup_all_vcfs(vcf_files, vcf_dirs): # Create the all_vcfs directory and link # all input vcf files into it for processing. @@ -465,7 +453,6 @@ multiprocessing.set_start_method('spawn') queue1 = multiprocessing.JoinableQueue() num_files = len(vcf_files) - cpus = set_num_cpus(num_files, args.processes) # Set a timeout for get()s in the queue. timeout = 0.05 @@ -495,7 +482,7 @@ queue1.put(vcf_dir) # Complete the get_snps task. - processes = [multiprocessing.Process(target=snp_finder.get_snps, args=(queue1, timeout, )) for _ in range(cpus)] + processes = [multiprocessing.Process(target=snp_finder.get_snps, args=(queue1, timeout, )) for _ in range(args.processes)] for p in processes: p.start() for p in processes:
--- a/vsnp_statistics.py Mon Dec 06 18:28:04 2021 +0000 +++ b/vsnp_statistics.py Fri Jun 10 06:11:08 2022 +0000 @@ -1,25 +1,29 @@ #!/usr/bin/env python import argparse -import gzip import os -from functools import partial - -import numpy -import pandas -from Bio import SeqIO class Statistics: - def __init__(self, reference, fastq_file, file_size, total_reads, mean_read_length, mean_read_quality, reads_passing_q30): - self.reference = reference - self.fastq_file = fastq_file + def __init__(self, file_name, file_size, seq_type, num_seqs, sum_len, min_len, avg_len, + max_len, q1, q2, q3, sum_gap, n50, pass_q20, pass_q30, read_quality_average): + self.file_name = file_name self.file_size = file_size - self.total_reads = total_reads - self.mean_read_length = mean_read_length - self.mean_read_quality = mean_read_quality - self.reads_passing_q30 = reads_passing_q30 + self.seq_type = seq_type + self.num_seqs = num_seqs + self.sum_len = sum_len + self.min_len = min_len + self.avg_len = avg_len + self.max_len = max_len + self.q1 = q1 + self.q2 = q2 + self.q3 = q3 + self.sum_gap = sum_gap + self.n50 = n50 + self.pass_q20 = pass_q20 + self.pass_q30 = pass_q30 + self.read_quality_average = read_quality_average def nice_size(size): @@ -43,75 +47,19 @@ return '??? bytes' -def get_statistics(dbkey, fastq_file, gzipped): - sampling_size = 10000 - # Read fastq_file into a data fram to - # get the phred quality scores. - _open = partial(gzip.open, mode='rt') if gzipped else open - with _open(fastq_file) as fh: - identifiers = [] - seqs = [] - letter_annotations = [] - for seq_record in SeqIO.parse(fh, "fastq"): - identifiers.append(seq_record.id) - seqs.append(seq_record.seq) - letter_annotations.append(seq_record.letter_annotations["phred_quality"]) - # Convert lists to Pandas series. - s1 = pandas.Series(identifiers, name='id') - s2 = pandas.Series(seqs, name='seq') - # Gather Series into a data frame. - fastq_df = pandas.DataFrame(dict(id=s1, seq=s2)).set_index(['id']) - # Starting at row 3, keep every 4 row - # random sample specified number of rows. - file_size = nice_size(os.path.getsize(fastq_file)) - total_reads = len(seqs) - # Mean Read Length - if sampling_size > total_reads: - sampling_size = total_reads - try: - fastq_df = fastq_df.iloc[3::4].sample(sampling_size) - except ValueError: - fastq_df = fastq_df.iloc[3::4].sample(sampling_size, replace=True) - dict_mean = {} - list_length = [] - i = 0 - for id, seq, in fastq_df.iterrows(): - dict_mean[id] = numpy.mean(letter_annotations[i]) - list_length.append(len(seq.array[0])) - i += 1 - mean_read_length = '%.1f' % numpy.mean(list_length) - # Mean Read Quality - df_mean = pandas.DataFrame.from_dict(dict_mean, orient='index', columns=['ave']) - mean_read_quality = '%.1f' % df_mean['ave'].mean() - # Reads Passing Q30 - reads_gt_q30 = len(df_mean[df_mean['ave'] >= 30]) - reads_passing_q30 = '{:10.2f}'.format(reads_gt_q30 / sampling_size) - stats = Statistics(dbkey, os.path.basename(fastq_file), file_size, total_reads, mean_read_length, - mean_read_quality, reads_passing_q30) - return stats - - -def accrue_statistics(dbkey, read1, read2, gzipped): - read1_stats = get_statistics(dbkey, read1, gzipped) - if read2 is None: - read2_stats = None - else: - read2_stats = get_statistics(dbkey, read2, gzipped) - return read1_stats, read2_stats - - -def output_statistics(read1_stats, read2_stats, idxstats_file, metrics_file, output_file): +def output_statistics(read1_stats, read2_stats, output_file): paired_reads = read2_stats is not None if paired_reads: - columns = ['Read1 FASTQ', 'File Size', 'Reads', 'Mean Read Length', 'Mean Read Quality', - 'Reads Passing Q30', 'Read2 FASTQ', 'File Size', 'Reads', 'Mean Read Length', 'Mean Read Quality', - 'Reads Passing Q30', 'Total Reads', 'All Mapped Reads', 'Unmapped Reads', - 'Unmapped Reads Percentage of Total', 'Reference with Coverage', 'Average Depth of Coverage', - 'Good SNP Count', 'Reference'] + columns = ['R1 FASTQ', 'R1 File Size', 'R1 Read Count', 'R1 Length Sum', 'R1 Min Length', + 'R1 Ave Length', 'R1 Max Length', 'R1 Q1', 'R1 Q2', 'R1 Q3', 'R1 Sum Gap', + 'R1 N50', 'R1 Passing Q20', 'R1 Passing Q30', 'R1 Read Quality Ave', 'R2 FASTQ', + 'R2 File Size', 'R2 Read Count', 'R2 Length Sum', 'R2 Min Length', 'R2 Ave Length', + 'R2 Max Length', 'R2 Q1', 'R2 Q2', 'R2 Q3', 'R2 Sum Gap', 'R2 N50', 'R2 Passing Q20', + 'R2 Passing Q30', 'R2 Read Quality Ave'] else: - columns = ['FASTQ', 'File Size', 'Mean Read Length', 'Mean Read Quality', 'Reads Passing Q30', - 'Total Reads', 'All Mapped Reads', 'Unmapped Reads', 'Unmapped Reads Percentage of Total', - 'Reference with Coverage', 'Average Depth of Coverage', 'Good SNP Count', 'Reference'] + columns = ['FASTQ', 'File Size', 'Read Count', 'Length Sum', 'Min Length', 'Ave Length', + 'Max Length', 'Q1', 'Q2', 'Q3', 'Sum Gap', 'N50', 'Passing Q20', 'Passing Q30', + 'Read Quality Ave'] with open(output_file, "w") as outfh: # Make sure the header starts with a # so # MultiQC can properly handle the output. @@ -119,97 +67,102 @@ line_items = [] # Get the current stats and associated files. # Get and output the statistics. - line_items.append(read1_stats.fastq_file) + line_items.append(read1_stats.file_name) line_items.append(read1_stats.file_size) - if paired_reads: - line_items.append(read1_stats.total_reads) - line_items.append(read1_stats.mean_read_length) - line_items.append(read1_stats.mean_read_quality) - line_items.append(read1_stats.reads_passing_q30) - if paired_reads: - line_items.append(read2_stats.fastq_file) - line_items.append(read2_stats.file_size) - line_items.append(read2_stats.total_reads) - line_items.append(read2_stats.mean_read_length) - line_items.append(read2_stats.mean_read_quality) - line_items.append(read2_stats.reads_passing_q30) - # Total Reads + line_items.append(read1_stats.num_seqs) + line_items.append(read1_stats.sum_len) + line_items.append(read1_stats.min_len) + line_items.append(read1_stats.avg_len) + line_items.append(read1_stats.max_len) + line_items.append(read1_stats.q1) + line_items.append(read1_stats.q2) + line_items.append(read1_stats.q3) + line_items.append(read1_stats.sum_gap) + line_items.append(read1_stats.n50) + line_items.append(read1_stats.pass_q20) + line_items.append(read1_stats.pass_q30) + line_items.append(read1_stats.read_quality_average) if paired_reads: - total_reads = read1_stats.total_reads + read2_stats.total_reads - else: - total_reads = read1_stats.total_reads - line_items.append(total_reads) - # All Mapped Reads - all_mapped_reads, unmapped_reads = process_idxstats_file(idxstats_file) - line_items.append(all_mapped_reads) - line_items.append(unmapped_reads) - # Unmapped Reads Percentage of Total - if unmapped_reads > 0: - unmapped_reads_percentage = '{:10.2f}'.format(unmapped_reads / total_reads) - else: - unmapped_reads_percentage = 0 - line_items.append(unmapped_reads_percentage) - # Reference with Coverage - ref_with_coverage, avg_depth_of_coverage, good_snp_count = process_metrics_file(metrics_file) - line_items.append(ref_with_coverage) - line_items.append(avg_depth_of_coverage) - line_items.append(good_snp_count) - line_items.append(read1_stats.reference) + line_items.append(read2_stats.file_name) + line_items.append(read2_stats.file_size) + line_items.append(read2_stats.num_seqs) + line_items.append(read2_stats.sum_len) + line_items.append(read2_stats.min_len) + line_items.append(read2_stats.avg_len) + line_items.append(read2_stats.max_len) + line_items.append(read2_stats.q1) + line_items.append(read2_stats.q2) + line_items.append(read2_stats.q3) + line_items.append(read2_stats.sum_gap) + line_items.append(read2_stats.n50) + line_items.append(read2_stats.pass_q20) + line_items.append(read2_stats.pass_q30) + line_items.append(read2_stats.read_quality_average) outfh.write('%s\n' % '\t'.join(str(x) for x in line_items)) -def process_idxstats_file(idxstats_file): - all_mapped_reads = 0 - unmapped_reads = 0 - with open(idxstats_file, "r") as fh: +def get_statistics(fastq_file, seqkit_stats_file, seqkit_fx2tab_file): + file_size = nice_size(os.path.getsize(fastq_file)) + # SeqKit statistics. + with open(seqkit_stats_file, "r") as fh: + # This is a 2-line file for i, line in enumerate(fh): - line = line.rstrip('\r\n') - items = line.split("\t") if i == 0: - # NC_002945.4 4349904 213570 4047 - all_mapped_reads = int(items[2]) - elif i == 1: - # * 0 0 82774 - unmapped_reads = int(items[3]) - return all_mapped_reads, unmapped_reads - - -def process_metrics_file(metrics_file): - ref_with_coverage = '0%' - avg_depth_of_coverage = 0 - good_snp_count = 0 - with open(metrics_file, "r") as ifh: - for i, line in enumerate(ifh): - if i == 0: - # Skip comments. + # Skip header continue line = line.rstrip('\r\n') items = line.split("\t") - if i == 1: - # MarkDuplicates 10.338671 98.74% - ref_with_coverage = items[3] - avg_depth_of_coverage = items[2] - elif i == 2: - # VCFfilter 611 - good_snp_count = items[1] - return ref_with_coverage, avg_depth_of_coverage, good_snp_count + file_name = fastq_file + seq_type = items[2] + num_seqs = items[3] + sum_len = items[4] + min_len = items[5] + avg_len = items[6] + max_len = items[7] + q1 = items[8] + q2 = items[9] + q3 = items[10] + sum_gap = items[11] + n50 = items[12] + try: + pass_q20 = items[13] + except IndexError: + pass_q20 = 0 + try: + pass_q30 = items[14] + except IndexError: + pass_q30 = 0 + # Average read quality is not normalized on length. + avg_sum = 0 + with open(seqkit_fx2tab_file, "r") as fh: + for i, line in enumerate(fh): + if i == 0: + # Skip header + continue + line = line.rstrip('\r\n') + items = line.split("\t") + avg_sum += float(items[3]) + read_quality_average = "{:.2f}".format(avg_sum / float(i - 1)) + return Statistics(file_name, file_size, seq_type, num_seqs, sum_len, min_len, avg_len, + max_len, q1, q2, q3, sum_gap, n50, pass_q20, pass_q30, read_quality_average) parser = argparse.ArgumentParser() -parser.add_argument('--dbkey', action='store', dest='dbkey', help='Reference dbkey') -parser.add_argument('--gzipped', action='store_true', dest='gzipped', required=False, default=False, help='Input files are gzipped') parser.add_argument('--output', action='store', dest='output', help='Output Excel statistics file') parser.add_argument('--read1', action='store', dest='read1', help='Required: single read') parser.add_argument('--read2', action='store', dest='read2', required=False, default=None, help='Optional: paired read') -parser.add_argument('--samtools_idxstats', action='store', dest='samtools_idxstats', help='Output of samtools_idxstats') -parser.add_argument('--vsnp_azc_metrics', action='store', dest='vsnp_azc_metrics', help='Output of vsnp_add_zero_coverage') +parser.add_argument('--read1_seqkit_stats', action='store', dest='read1_seqkit_stats', help='Output of SeqKit statistics for forward read') +parser.add_argument('--read2_seqkit_stats', action='store', dest='read2_seqkit_stats', required=False, default=None, help='Output of SeqKit statistics for reverse read') +parser.add_argument('--read1_seqkit_fx2tab', action='store', dest='read1_seqkit_fx2tab', help='Output of SeqKit fx2tab for forward read') +parser.add_argument('--read2_seqkit_fx2tab', action='store', dest='read2_seqkit_fx2tab', required=False, default=None, help='Output of SeqKit fx2tab for reverse read') args = parser.parse_args() -stats_list = [] -idxstats_files = [] -metrics_files = [] -# Accumulate inputs. -read1_stats, read2_stats = accrue_statistics(args.dbkey, args.read1, args.read2, args.gzipped) -output_statistics(read1_stats, read2_stats, args.samtools_idxstats, args.vsnp_azc_metrics, args.output) +read1_stats = get_statistics(args.read1, args.read1_seqkit_stats, args.read1_seqkit_fx2tab) +if args.read2 is None: + read2_stats = None +else: + read2_stats = get_statistics(args.read2, args.read2_seqkit_stats, args.read2_seqkit_fx2tab) + +output_statistics(read1_stats, read2_stats, args.output)