# HG changeset patch
# User iuc
# Date 1605131691 0
# Node ID 60573349e9aeec709b78066044afad7603c0e3af
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/shasta commit 6d14992ea4fb1af09373d51b3a48166afcbd3a74"
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Dec2019.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,51 @@
+# This file contains Shasta options that, as of December 2019,
+# are known to work with Oxford Nanopore reads under the following
+# circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.0.5 base caller. Also known to work with
+# reads from other Guppy releases 3.0.x and 3.1.x.
+
+# To use this configuration file, specify Shasta option "--config PathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options require root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 10000
+
+[MinHash]
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+minAlignedFraction = 0.4
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.0.5-a
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Jun2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-Jun2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,74 @@
+# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A
+# GUPPY VERSION OLDER THAN 3.6.0.
+
+# This file contains Shasta options that, as of June 2020,
+# are known to work with Oxford Nanopore reads under the following
+# circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.6.0 base caller. If you have reads
+# from an older version of Guppy, use configuration file
+# Nanopore-Dec2019.conf instead.
+
+# To use this configuration file, specify Shasta option
+# "--config AbsolutePathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options requires root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 10000
+noCache = True
+
+[Kmers]
+# Due to the higher accuracy of Guppy 3.6.0 we use longer
+# markers than usual.
+k = 14
+
+[MinHash]
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+downsamplingFactor = 0.05
+matchScore = 6
+minAlignedFraction = 0.55
+minAlignedMarkerCount = 400
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+[MarkerGraph]
+simplifyMaxLength = 10,100,1000,10000,100000
+refineThreshold = 6
+crossEdgeCoverageThreshold = 3
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.6.0-a
+detangleMethod = 1
+
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-OldGuppy-Sep2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-OldGuppy-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,83 @@
+# This file contains Shasta options which attempt to partially automate
+# parameter selection. It is based on an earlier config, which, as of Jun 2020,
+# was known to work with Oxford Nanopore reads under the following circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.0.5 base caller. Also known to work with
+# reads from other Guppy releases 3.0.x and 3.1.x.
+
+# The automation provided by this config is particularly applicable to
+# low coverage or non-human samples. It also matches or exceeds continuity
+# in human samples, relative to the appropriately chosen config file.
+# Updating to guppy 3.6.0 or higher will greatly improve assembly
+# quality and is therefore strongly recommended.
+
+# To use this configuration file, specify Shasta option
+# "--config AbsolutePathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options requires root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 10000
+noCache = True
+
+[MinHash]
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+downsamplingFactor = 0.05
+matchScore = 6
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+# The following Align parameters are set to very permissive values to allow the majority of alignments
+# to be assessed during the initial stage of automatic alignment parameter selection
+maxSkip = 100
+maxDrift = 100
+maxTrim = 100
+minAlignedMarkerCount = 10
+minAlignedFraction = 0.1
+
+[ReadGraph]
+# This method uses the observed distribution of alignment stats to choose a cutoff for
+# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction
+creationMethod = 2
+
+[MarkerGraph]
+simplifyMaxLength = 10,100,1000,10000,100000
+crossEdgeCoverageThreshold = 3
+
+# Automatically determine this using PeakFinder
+minCoverage = 0
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.0.5-a
+detangleMethod = 2
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-Sep2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,94 @@
+# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A
+# GUPPY VERSION OLDER THAN 3.6.0.
+
+# This file contains Shasta options which attempt to partially automate
+# parameter selection. It is based on an earlier config, which, as of Jun 2020,
+# was known to work with Oxford Nanopore reads under the following circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.6.0 base caller. If you have reads
+# from an older version of Guppy, use configuration file
+# Nanopore-Dec2019.conf instead.
+
+# The automation provided by this config is particularly applicable to
+# low coverage or non-human samples. It also matches or exceeds continuity
+# in human samples, relative to the appropriately chosen 3.6.0 or 3.6.0-UL conf.
+# Automation can also be activated with parameters designed for earlier basecallers,
+# if needed, but updating to guppy 3.6.0 or higher will greatly improve assembly
+# quality and is therefore strongly recommended.
+
+# To use this configuration file, specify Shasta option
+# "--config AbsolutePathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options requires root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 10000
+noCache = True
+
+[Kmers]
+# Due to the higher accuracy of Guppy 3.6.0 we use longer
+# markers than usual.
+k = 14
+
+[MinHash]
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+downsamplingFactor = 0.05
+matchScore = 6
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+# The following Align parameters are set to very permissive values to allow the majority of alignments
+# to be assessed during the initial stage of automatic alignment parameter selection
+maxSkip = 100
+maxDrift = 100
+maxTrim = 100
+minAlignedMarkerCount = 10
+minAlignedFraction = 0.1
+
+[ReadGraph]
+# This method uses the observed distribution of alignment stats to choose a cutoff for
+# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction
+creationMethod = 2
+
+[MarkerGraph]
+simplifyMaxLength = 10,100,1000,10000,100000
+crossEdgeCoverageThreshold = 3
+
+# Automatically determine this using PeakFinder
+minCoverage = 0
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.6.0-a
+detangleMethod = 2
+
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Dec2019.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-UL-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,53 @@
+# This file contains Shasta options that, as of December 2019,
+# are known to work with Ultra-Long (UL) Oxford Nanopore reads
+# under the following circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.0.5 base caller. Also known to work with
+# reads from other Guppy releases 3.0.x and 3.1.x.
+
+# To use this configuration file, specify Shasta option "--config PathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options require root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 50000
+
+[MinHash]
+minBucketSize = 5
+maxBucketSize = 40
+minFrequency = 10
+
+[Align]
+maxSkip = 60
+maxDrift = 60
+minAlignedMarkerCount = 400
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.0.5-a
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Jun2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-UL-Jun2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,78 @@
+# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A
+# GUPPY VERSION OLDER THAN 3.6.0.
+
+# This file contains Shasta options that, as of June 2020,
+# are known to work with Ultra-Long (UL) Oxford Nanopore reads
+# under the following circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.6.0 base caller. If you have reads
+# from an older version of Guppy, use configuration file
+# Nanopore-UL-Dec2019.conf instead.
+
+# To use this configuration file, specify Shasta option
+# "--config AbsolutePathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options requires root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 50000
+noCache = True
+
+[Kmers]
+# Due to the higher accuracy of Guppy 3.6.0 we use longer
+# markers than usual.
+k = 14
+
+[MinHash]
+minBucketSize = 10
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+downsamplingFactor = 0.05
+matchScore = 6
+minAlignedFraction = 0.55
+minAlignedMarkerCount = 600
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+[ReadGraph]
+maxAlignmentCount = 12
+
+
+[MarkerGraph]
+simplifyMaxLength = 10,100,1000,10000,100000
+refineThreshold = 6
+crossEdgeCoverageThreshold = 3
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.6.0-a
+detangleMethod = 1
+
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-Sep2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-UL-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,89 @@
+# DO NOT USE THIS FILE IF YOU HAVE READS CREATED BY A
+# GUPPY VERSION OLDER THAN 3.6.0.
+
+# This file contains Shasta options which attempt to partially automate
+# parameter selection. It is based on an earlier config, which, as of Jun 2020,
+# was known to work with Oxford Nanopore reads under the following circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+# - Reads from Guppy 3.6.0 base caller. If you have reads
+# from an older version of Guppy, use configuration file
+# Nanopore-UL-Dec2019.conf instead.
+
+# The automation provided by this config is particularly applicable to
+# low coverage or non-human samples. It also matches or exceeds continuity
+# in human samples, relative to the appropriately chosen 3.6.0 or 3.6.0-UL conf.
+# Automation can be activated with parameters designed for earlier basecallers,
+# if needed, but updating to guppy 3.6.0 or higher will greatly improve assembly
+# quality and is therefore strongly recommended.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options requires root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+
+[Reads]
+# If you have extra coverage, use this option to adjust coverage.
+minReadLength = 50000
+noCache = True
+
+[Kmers]
+# Due to the higher accuracy of Guppy 3.6.0 we use longer
+# markers than usual.
+k = 14
+
+[MinHash]
+minBucketSize = 10
+maxBucketSize = 30
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+downsamplingFactor = 0.05
+matchScore = 6
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+# The following Align parameters are set to very permissive values to allow the majority of alignments
+# to be assessed during the initial stage of automatic alignment parameter selection
+maxSkip = 100
+maxDrift = 100
+maxTrim = 100
+minAlignedMarkerCount = 10
+minAlignedFraction = 0.1
+
+[ReadGraph]
+# This method uses the observed distribution of alignment stats to choose a cutoff for
+# maxSkip, maxDrift, maxTrim, minAlignedMarkerCount, and minAlignedFraction
+creationMethod = 2
+
+[MarkerGraph]
+simplifyMaxLength = 10,100,1000,10000,100000
+crossEdgeCoverageThreshold = 3
+
+# Automatically determine this using PeakFinder
+minCoverage = 0
+
+[Assembly]
+consensusCaller = Bayesian:guppy-3.6.0-a
+detangleMethod = 2
+
+
diff -r 000000000000 -r 60573349e9ae configs/Nanopore-UL-iterative-Sep2020.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/Nanopore-UL-iterative-Sep2020.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,46 @@
+# This configuration file is EXPERIMENTAL and should only
+# be used under the following conditions:
+# - Nanopore reads created by Guppy 3.6.0 or newer.
+# - Ultra-Long (UL) reads with typical N50 80Kb or more.
+# - High coverage 80X.
+# Iterative assembly results in some separation of haplotypes
+# and does better at resolving segmental duplications.
+
+[Reads]
+minReadLength = 30000
+noCache = True
+
+[Kmers]
+k = 10
+
+[MinHash]
+minBucketSize = 10
+maxBucketSize = 40
+minFrequency = 5
+
+[Align]
+alignMethod = 3
+matchScore = 6
+gapScore = -3
+downsamplingFactor = 0.05
+maxSkip = 100
+maxDrift = 100
+maxTrim = 100
+minAlignedMarkerCount = 10
+minAlignedFraction = 0.1
+sameChannelReadAlignment.suppressDeltaThreshold = 30
+
+[ReadGraph]
+maxAlignmentCount = 12
+creationMethod = 2
+
+[MarkerGraph]
+minCoveragePerStrand = 3
+simplifyMaxLength = 10,100
+crossEdgeCoverageThreshold = 3
+
+[Assembly]
+detangleMethod = 2
+consensusCaller = Bayesian:guppy-3.6.0-a
+iterative = True
+
diff -r 000000000000 -r 60573349e9ae configs/PacBio-CCS-Dec2019.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/PacBio-CCS-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,50 @@
+# This file contains Shasta options that, as of December 2019,
+# are known to work with PacBio CCS reads under the following
+# circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+
+# To use this configuration file, specify Shasta option "--config PathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options require root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+[Kmers]
+k = 15
+probability = 0.02
+
+[MinHash]
+m = 12
+minBucketSize = 20
+maxBucketSize = 100
+minHashIterationCount = 25
+minFrequency = 10
+
+[ReadGraph]
+maxAlignmentCount = 20
+
+[Assembly]
+consensusCaller = Modal
+
+
diff -r 000000000000 -r 60573349e9ae configs/PacBio-CLR-Dec2019.conf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/configs/PacBio-CLR-Dec2019.conf Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,45 @@
+# This file contains Shasta options that, as of December 2019,
+# are known to work with PacBio CLR reads under the following
+# circumstances:
+
+# - Human genome assembly.
+# - Coverage between 40x and 80x. If you have more coverage than that,
+# you can use option "--Reads.minReadLength" to adjust coverage as desired.
+
+# To use this configuration file, specify Shasta option "--config PathToThisFile".
+# If you specify any conflicting values on the command line,
+# the values specified on the command line take precedence.
+
+# In most cases, for best performance on a large assembly
+# you will usually also want to use the following options, which
+# cannot be specified in a configuration file:
+# --memoryMode filesystem
+# --memoryBacking 2M
+# Using these options require root access.
+
+# For detailed information on all available options see here:
+# https://chanzuckerberg.github.io/shasta/CommandLineOptions.html
+
+# For information on running a small assembly for which
+# performance is not essential see here:
+# https://chanzuckerberg.github.io/shasta/QuickStart.html
+
+# For more information on running an assembly see here:
+# https://chanzuckerberg.github.io/shasta/Running.html
+
+# For information on optimizing assembly performance see here:
+# https://chanzuckerberg.github.io/shasta/Performance.html
+
+
+[Reads]
+# Use this option to adjust coverage.
+minReadLength = 10000
+
+[ReadGraph]
+maxAlignmentCount = 20
+
+[Assembly]
+consensusCaller = Modal
+
+
+
diff -r 000000000000 -r 60573349e9ae macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,82 @@
+
+
+ 0.6.0
+ 18.01
+
+
+ shasta
+
+
+
+ shasta --version
+
+
+
+ 10.1038/s41587-020-0503-6
+ @online{shasta,
+ author = {TODOLastName,TODOFirstName},
+ title = {shasta},
+ year = 2020,
+ url = {https://github.com/chanzuckerberg/shasta},
+ urldate = {2020-11-05}
+ }
+
+
+
+ ./input_${counter}.${ext} &&
+ #elif $input.is_of_type("fastq.gz","fastqsanger.gz")
+ #set $ext = "fastq"
+ gzip -dcf '$input' > ./input_${counter}.${ext} &&
+ #elif $input.is_of_type("fastqsanger", "fastq"):
+ #set $ext = "fastq"
+ ### I tried symlinking but shasta still complained about file extensions
+ cp '$input' ./input_${counter}.${ext} &&
+ #elif $input.is_of_type("fasta"):
+ #set $ext = "fasta"
+ ### I tried symlinking but shasta still complained about file extensions
+ cp '$input' ./input_${counter}.${ext} &&
+ #end if
+#end for
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ `_ or the `github `_ .
+ ]]>
+
diff -r 000000000000 -r 60573349e9ae shasta.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/shasta.xml Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,832 @@
+
+
+ De novo assembly of long read sequencing data
+
+ macros.xml
+
+
+
+
+
+
+ &2
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ ^([0-9]*)?([KMG]bp?)?$
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ ^[0-9]+(,[0-9]+)*$
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ outputs["report_graphical_fragment_assembly"]
+
+
+ outputs["report_config"]
+
+
+ outputs["report_log"]
+
+
+
+
+ assembly["write_reads_by_assembled_segment"]
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ `_ (these files correspond to the packaged config files available for this tool).
+
+**Output**
+
+- Assembled genome (FASTA)
+- Graphical fragment assembly (optional) (.gfa1)
+- Log file (optional) (.txt)
+- Config file (optional) (.txt)
+- Read CSV detailing which reads align to which assembly fragments (optional) (.csv)
+- Coverage CSV List (optional) (list:.csv)
+
+**References**
+
+@REFERENCES@
+ ]]>
+
+
diff -r 000000000000 -r 60573349e9ae test-data/nanopore.fasta.gz
Binary file test-data/nanopore.fasta.gz has changed
diff -r 000000000000 -r 60573349e9ae test-data/out_config.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/out_config.txt Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,100 @@
+[Reads]
+minReadLength = 10000
+desiredCoverage = 0
+noCache = False
+palindromicReads.skipFlagging = False
+palindromicReads.maxSkip = 100
+palindromicReads.maxDrift = 100
+palindromicReads.maxMarkerFrequency = 10
+palindromicReads.alignedFractionThreshold = 0.1
+palindromicReads.nearDiagonalFractionThreshold = 0.1
+palindromicReads.deltaThreshold = 100
+
+[Kmers]
+generationMethod = 0
+k = 10
+probability = 0.1
+enrichmentThreshold = 100
+file =
+
+[MinHash]
+version = 0
+m = 4
+hashFraction = 0.01
+minHashIterationCount = 10
+alignmentCandidatesPerRead = 20
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+allPairs = False
+
+[Align]
+alignMethod = 3
+maxSkip = 30
+maxDrift = 30
+maxTrim = 30
+maxMarkerFrequency = 10
+minAlignedMarkerCount = 100
+minAlignedFraction = 0.4
+matchScore = 6
+mismatchScore = -1
+gapScore = -1
+downsamplingFactor = 0.1
+bandExtend = 10
+maxBand = 1000
+sameChannelReadAlignment.suppressDeltaThreshold = 0
+suppressContainments = False
+
+[ReadGraph]
+creationMethod = 0
+maxAlignmentCount = 6
+minComponentSize = 100
+maxChimericReadDistance = 2
+crossStrandMaxDistance = 6
+containedNeighborCount = 6
+uncontainedNeighborCountPerDirection = 3
+removeConflicts = False
+markerCountPercentile = 0.015
+alignedFractionPercentile = 0.12
+maxSkipPercentile = 0.12
+maxDriftPercentile = 0.12
+maxTrimPercentile = 0.015
+
+[MarkerGraph]
+minCoverage = 10
+maxCoverage = 100
+minCoveragePerStrand = 0
+lowCoverageThreshold = 0
+highCoverageThreshold = 256
+maxDistance = 30
+edgeMarkerSkipThreshold = 100
+pruneIterationCount = 6
+simplifyMaxLength = 10,100,1000
+crossEdgeCoverageThreshold = 0
+refineThreshold = 0
+reverseTransitiveReduction = False
+peakFinder.minAreaFraction = 0.08
+peakFinder.areaStartIndex = 2
+
+[Assembly]
+crossEdgeCoverageThreshold = 3
+markerGraphEdgeLengthThresholdForConsensus = 1000
+consensusCaller = Bayesian:guppy-3.0.5-a
+storeCoverageData = False
+storeCoverageDataCsvLengthThreshold = 0
+writeReadsByAssembledSegment = True
+detangleMethod = 0
+detangle.diagonalReadCountMin = 1
+detangle.offDiagonalReadCountMax = 2
+detangle.offDiagonalRatio = 0.3
+iterative = False
+iterative.iterationCount = 3
+iterative.pseudoPathAlignMatchScore = 1
+iterative.pseudoPathAlignMismatchScore = -1
+iterative.pseudoPathAlignGapScore = -1
+iterative.mismatchSquareFactor = 3
+iterative.minScore = 0
+iterative.maxAlignmentCount = 6
+iterative.bridgeRemovalIterationCount = 3
+iterative.bridgeRemovalMaxDistance = 2
+
diff -r 000000000000 -r 60573349e9ae test-data/out_config2.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/out_config2.txt Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,100 @@
+[Reads]
+minReadLength = 10000
+desiredCoverage = 0
+noCache = False
+palindromicReads.skipFlagging = False
+palindromicReads.maxSkip = 100
+palindromicReads.maxDrift = 100
+palindromicReads.maxMarkerFrequency = 10
+palindromicReads.alignedFractionThreshold = 0.1
+palindromicReads.nearDiagonalFractionThreshold = 0.1
+palindromicReads.deltaThreshold = 100
+
+[Kmers]
+generationMethod = 0
+k = 10
+probability = 0.1
+enrichmentThreshold = 100
+file =
+
+[MinHash]
+version = 0
+m = 4
+hashFraction = 0.01
+minHashIterationCount = 10
+alignmentCandidatesPerRead = 20
+minBucketSize = 5
+maxBucketSize = 30
+minFrequency = 5
+allPairs = False
+
+[Align]
+alignMethod = 3
+maxSkip = 30
+maxDrift = 30
+maxTrim = 30
+maxMarkerFrequency = 10
+minAlignedMarkerCount = 100
+minAlignedFraction = 0.4
+matchScore = 6
+mismatchScore = -1
+gapScore = -1
+downsamplingFactor = 0.1
+bandExtend = 10
+maxBand = 1000
+sameChannelReadAlignment.suppressDeltaThreshold = 0
+suppressContainments = False
+
+[ReadGraph]
+creationMethod = 0
+maxAlignmentCount = 6
+minComponentSize = 100
+maxChimericReadDistance = 2
+crossStrandMaxDistance = 6
+containedNeighborCount = 6
+uncontainedNeighborCountPerDirection = 3
+removeConflicts = False
+markerCountPercentile = 0.015
+alignedFractionPercentile = 0.12
+maxSkipPercentile = 0.12
+maxDriftPercentile = 0.12
+maxTrimPercentile = 0.015
+
+[MarkerGraph]
+minCoverage = 10
+maxCoverage = 100
+minCoveragePerStrand = 0
+lowCoverageThreshold = 0
+highCoverageThreshold = 256
+maxDistance = 30
+edgeMarkerSkipThreshold = 100
+pruneIterationCount = 6
+simplifyMaxLength = 10,100,1000
+crossEdgeCoverageThreshold = 0
+refineThreshold = 0
+reverseTransitiveReduction = False
+peakFinder.minAreaFraction = 0.08
+peakFinder.areaStartIndex = 2
+
+[Assembly]
+crossEdgeCoverageThreshold = 3
+markerGraphEdgeLengthThresholdForConsensus = 1000
+consensusCaller = Bayesian:guppy-3.0.5-a
+storeCoverageData = False
+storeCoverageDataCsvLengthThreshold = 0
+writeReadsByAssembledSegment = False
+detangleMethod = 0
+detangle.diagonalReadCountMin = 1
+detangle.offDiagonalReadCountMax = 2
+detangle.offDiagonalRatio = 0.3
+iterative = False
+iterative.iterationCount = 3
+iterative.pseudoPathAlignMatchScore = 1
+iterative.pseudoPathAlignMismatchScore = -1
+iterative.pseudoPathAlignGapScore = -1
+iterative.mismatchSquareFactor = 3
+iterative.minScore = 0
+iterative.maxAlignmentCount = 6
+iterative.bridgeRemovalIterationCount = 3
+iterative.bridgeRemovalMaxDistance = 2
+
diff -r 000000000000 -r 60573349e9ae test-data/out_fasta.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/out_fasta.fasta Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,2 @@
+>0 length 16594
+TCACCTTTCTGCGTTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCCTCCTGTCTTTTTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTCGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGCTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAGTAGTACCTTCTTGTACAGCTCTATCGCCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACCAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGCCTGCGTGCTCACCCCCTTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCACTGCGCTGTCCATCAACCGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCCAGTTACCAGAATCAAAATTAAATTAAATTAAAAAATTTCAACGGCTTAATTTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCCCTCCCTCTCCAGATCGTCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCGCTGGCCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTGATTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAATAACAAACTTCCAAGTTTACACACTTTTGAGAGTGTCACTCTGCCCAAACCGTCATCTCTGGGATGAGCTGATAGGTCCACCTCCCCCCGTCGCGACGTTTGCCATCTGCTCTGCCATTCACCTAATAGCCACTCGTGTGCCTCTTGCCTGGAAGCGCCACTCCGCATAAGGCTGAGAGCCTTGATCTCCAGATCAATCGGCAGGCCTGCCAGCGCTAGCGCCGCGTCTTCGGATATGGTCCTGAATCCTCTAATGAGCCTGAGGGCCATTGACCGTAGCACCGAACGAGCTCCTTTCAGGTATGAGACCCTGCAAGTGGCATTGCTCCAGACTGGTGCAGCGTATAGCAGCGAAGCCTTTGCTACTGACACCAGCAGTTTCCTGGCCGGGTGTCTTGGGCCTCCGACGTTGGGCATGCCTCGCCAACGAAGAGGATGTGACTGCTGTCTTCTTGCTGGCGTAGCTCGCGTGGTCCTTGAACGATAGTCTGCGATCTATCATTACCCCCAGGTACTTTAGGGACTCTTGAGAGGTCCCCTGAGTACCCTTGACGGAGACCAGCATGTTCTCCATCTTTTCCTGCTGCTTAGTAGGACTGCTTCGGTCTTGTGAGCCGCTATTGCTAGCCCGGCTGTGATTGCCACATCGTCAGCGAAACAGCTGCCTCGACGACTTCAAGTTCTGTGACGCACGGGAAATCTGGGGCAGGGGCTGCCTCTGTTGGCCTCCATAGTGTGGTCTGCTTTGGAAATAGCTCCCCTAGTATGTTAGCCAGGACCCCCGGGTCGGATGGGGTTGCCGCTCCTCCTCCTCCTTAGCTGCTTGGTAACAAGCTTGTAGGCGAGGCCCCAGATATCGCTGTCTACGCCATCCTGCAGCTCCTTAAACGACCGCGCTTTGGCAGCCGCGATGCCGTGCTTGAACTCTAGGCGTTTGCTTCTGAAAGCCTCCAAGAGTTCCGCGTGGTGGAGTACTGCCTCTGGCTCGTTGCGCCGTTCTCTTAGCCCTGAGGCAATCAGACCGTAGTTGGCTTAGGGAGGCACTCCACCAGTAAACGGGTGGTTTGCGCTGTGCCTTATTTTTTCCTTGGCATGATTGCGTCGCAGATTCTTCCCAGCATATTCATGAGGCCTGCCGCCATACTCTCTGCGTCCACATTTGGGATTTCCAGGGGAATTGATCTGATAGGCCAGCATGGCCTCATCGATCTTCCTGGTGTCCCATGTTTTCCCGGCTGTTCTACTCTGCCGTCTTTTGGGCATGTCCCTCCGGGGAGAAGGAGATCAGGGCATGGTCGCTCAGCGTCATGACGTCATGGACCATCCAGTTGTTGTTGTCTACTAGCCCTCTGCTGACAAAGGTAACGTCAATAAAGGACGTACCCCTATCGTTGTTAAACGTCGGCTTCCGTCCATCGTTCAGCAGTATGAGGTCCAGCATTCGCATGGCGTCAATCACAGCTCGTCCTCTGGTGTTGGATGTCCTGCTGCCCCATTCCACTGTCCAGGCATTAAAGTCGCCGGTATGACCTTCGGGCTTGCCCTCTCGCATGGTCCACGAGCGCCTCCAGAAGCCCTCGAACTGATCGGGGGTGTCGCTCGGCGGAGCGTAGCAGCTGTACATGTGCACGTGTTTTAACTTCGCATAAGCGATACCCCGCATGGGTAAAGCAGCCAGTTCCTGGACTTGAGAGAGCTGCAGCATTTGATAGCTGCTTTTACCTGCCTCGTCAAGGATCATGGACGATTGTCCACTACCAGAGACGTAGGGTTCGCTTAGGAGCATGATGTCTACATTGCGCTCAACCGCAGTCTGGGCCAGGAGGCTCTGAGCTGCTGCGCAATGATTGACATTGAGCTGTACTACGCTAATATGAGCGTGCATTAAGGTGGCTCTTGGCATCTTTTAGTGTCGCTCTGTAAGTCGGGCACGCAAAGCTACCCGTCGGGTGGTTTCTGTCCACCTCGCTGCTGCAGATCAGGCATTTTGGTGCAGCAACGCACCCCTTTGCCTTGTGCCCACGCTCACCGCATCTAAGACAGCAGTCTGCCCTGTCAGTGTCCTTGCAGGTTGCTGATCGATGCCCATAGCCGAGACACCTGTAGCATCTCGTGGGTCGGACGTCCTGGGTGATACGACATCTTGACCATCCAACGATTATGGTGCCCTGTTTAAGGACTGGTATCGCAACGTTCGCGTTCAGCAGCACTGAGGCTATTTGCTTTGCAATTCCGCATACTGCGAAGGCCCCTGATATCTTCAGGATTTATCTGCAGGCCCTGGAATTGGGCGACCAAGCAGCTGTGGAGCTTCTCTGCTGTCGTAGCCTCGTCCAATCCGCTGCAAGATAGAGCTATTCTTTGCGCTCCCTGTGCGCACAGAGGTTAAGTCATTGAGCGCCGCTTCCAGGTCGCTCTTAAACTTGGGAACGCTTTCGAAGCTTTCCCCTCTACCTCAAGCAACAGATCACCTTTCTGCGTTCTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCTCCTGTCTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAAGTAGTACCTTCGTACAGCTCTATCGCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACAAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGGCCTGCGTGCTCACCCCTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCCACTGCGCTGTCCATCAACTGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCCTGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCAGTTACCAGAATCAAAATTAAATTAAATTAAATTTCAACGGCTTAATTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCTCCCTCTCCAGATCGCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCTGCTGGCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTTGATTTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAACAACGAATTCCAAGTTTAAAGCACTTTTGAGAGTTTCAAGAAACTCTTTACACAAAAACACTAAACCTAAGTTTAATCCTAAATTTTTAAATTATTTTGTTAAAATTTGAAAAGTTGTAGTATTTAGTATGACCCCCCATTGGCTTTGGCTACAAGTTGAAGCTTTTTTTTCATGGAATGGATGAGTTTTTTTTAGGTCATATTCAAGCGGGATCTTTTCCCACTCTATCGCAGCCATGAGCTGTTGTCGTGTTTTGGTGCCCCTTTTGCCACATTCTTCTTTAAGTAGGCCCACAAATTTTCAATGGGGTTCAGATCAAGACTCTGAGGGGGCGTATCGATCACCTTGCCACAGTTATAAAGGAGCCAGTTGCGTACATTGCACTCTTTATGTTTTGGGATCATTGTCCTGATAAAACTTAAAATTTGGCTTGTTGTTGCTAAATAGACCAAATTTTTTCTGCACTGGCCTTCAAATTTGATTTTAAAATATCTAGATATTGCACGGCATTCATAGTGCTTTCAATAAAGGCTAATTTGCCCACTCCATGGCTTGAGATACAGCCCCAAATCATCACTGATAATTTTCCAAATTTGATTGTTGGAATGATATTTTGTTTTTTCTAGCGCACTCAACAGCTTGCGCCATACTCTGCTTGGCCCATCGTTATAATAGAGCATCATTTTTGTTTCGTCACAAAATATTACGTCATCCCAGTACTCTTCCGCATGATCCATCATGCTCACAGCGAATGAATGACGCTTTTCTATATTGACCTCTGATAGCAAAGGCTTTTTTTCTTGCAACTCTTGAAGAGTACCTATGGCGTAGAATGACTTGGCGCACAGTTTTGTGTGGCACAACTAGGTCACATTCTTGCCTGATATCCTGAGCAAGTGATCTGACCGAGATTCAGGGGGGTTCGCAATCACTTTTCGCATAATAAGGCGGTCTACACGCTTGCTAATTTTAGTTTTGCGCCCACCACTCTTAGGTTCAAGCCTGTTCTCTTTTTTCAAGCGATTAAAACATTGTAGACGGTCTTACGGGATACAGAAAACATTTATACTAATTCTGGAATAGATTTTCCCAACTGGTGGTTTTAGTATATTATTTGGGTCACTTCAAAAGCTAATCTATTTCCAGGCATTTTTATTAAATTTAATAACTCATTCGATCAGCAAAATTTCACAAGCAAAGTAAAAAAAATTTCAATAGAAGCGTTGTAAAAAGGAATGCAAATGCCAAAAATAACGGAAAAATCGAGTTCGTTCTAAGAAAAGAGCAAAACAAAGTAGGAAAACAAAATGTGTAAGGAGTTTCTTGCCACTCTCAAAAGTGTGTAAACTTGGAATTTGTTGTTTAATTTCTTGTATATTTGATATTTTGAATTTGTTTTTTTAATTTATAAGTAAAATAAATATTGTTTAATTATATTTCATTAAAAAATTGCGTTTAATTAAAGAAATAACCCTTAATTTTGATTTAAACCTTTAAAATGAAAAATTCAACTTATTTCACGGCGTGTAAATAGTTTCTTGACAAACTGTATATATCTACAAATTTACAACTTGCCGGTACCATCTGCAAGATTCATTACATTGAGAAGTGGACTTTGACTCTCAGAATGAATTAAAACATTATATTCTTAGATTGAACTGACGAGGAACCAGACTGAACTAACTAAACTAACTATCATTTAACTAAATTTAATTGTTTGCTGATAATTTTGAGTTTCTTACAAAGATGACTAATATTAATTTTTAGTTAAAATAGTTTGCAAAACTGAATTTATGTAAATAATATGTTCAATTGATCTGGTTGGGTTTTCTGGGTCTCCCCAACACCTCGCAACGAATGCTGGATCAAAATTATTCGTCAGAAGGACGTGCACAGTCTCGTGAGTAATAAAAGTACAGCAATCTTACTTTGAGGTGGCGTGTTGGAAAGTATGTACACATTTAAGCAAAAGTCACATGGCCTGCATCAAAGACACTAGAATAATAAGATGCGTAACAGCCATACACTGGTTTGGCACTATGCAGCCACTTTTTTTTGGTGACGGCCAAAATTGCTCTCTTTCCGCTCGCTCACGCTGAGCGTAAGAAATCTAAAATAGAATTTGCTTGCTTGTGTGAGTAAAAACAAAAGACGAGAACGCGTATATGTGTGCGTGTTGTGCTAGAAGGCGATTTTCGGGCCGAAATCAATTCTGATCGCAGTAACGAATTTACATATGTACATACATATTTGGGGAGTTTTGGCCAATTTCGTAGAATATGATGAAATTGCGCGCTGTTTAAGATATCAAATTGGAATATAAAAAAAACTGAAAAGAAGTCATTACACTGAGAAAAAATATTTCATAAAAAAATAATACGAAGTAGAAAATAAAAATTTATAAAATAAAAAAAAATGTTAACTGTTTATTGCAAACGTCATATCAAATTAGAATTATTCTAGTGTCTTTGCTTTGGTCATATCTTGAGGCACGAAGTGCGGACCAAAGCACTCAACAATCATTGTCTTCTTAATACTCAAGCAGAGCGACACCGACGAAGACCCTAACTGCTTTGAAATGGCGAAGTAAAATAAAATCAAAAAAAGAGACCAAGCCCCTCCCGAAGTTCAAAGAAAACAGGATTCCCTGGACAATTCATCAAGCACCAGCGCAAATAATTTCGCTCTCTTAAGCGACGGATTGCCCGACAAAACAGGAAACAAATATAACAAAACGAAGATCTCGAAATGGTAAAGTGAAGACAGTGCAACTGATTTTGCTAAGCCCCACCTATCTTTCTCTCTGACGTCAATGGTATAAGTGAAAAGCTAACCTATCTTAAAACTAAAATTAAGAGAACTTTTTTTTATTATAAGACTCAACGTTATGGACATGTAGAGGTAATGGTTAAAAGTATTGAAGAATTCTGAAAATTAGTCAAAACACTTAATAATGATTGTGTGCAGTACCACACATACCAGCTTAAGGATGACAGAGCATTTAGAGTTGTTATTAAGAATTTGCATTTTCCACAAATTTAGATGAAATTAAAAGTGATGAAGAGTCAAAAGGTCATGTTGTTAGAAACATAAGTAATATTAAAAAGCCGTGCGACCAAAACGTCACTGAACATGTTTTATGTAGATATTGAGCCTAACAAAAAAAACCTAGACATATATAATGTAAATAAAATATTGAGCCTCCCCACAATGAAATCGTTCAATGCTATAGCTGCCAGGAATTCGGACATACTAAATCATATTGTACCAAAACGTACCGCTGTGTAAAATCCTCTTCTCGACACCCAAGCAACATTTGCCCGAAAAATACAGAACAACCAGCAAAATGTGCCAACTGCTACGAAGAACACGCCGCCAGCTACAAAGGGTGTAGAATTTATCAGGAACTCTTGTCCAAAAAAAAATAGAAAATAGAAATAATGATCTGAGTAAAATGATTTAGGAATCCAGCAAAGTTTGTTCCGCCTAACAAGCCAACATATACCCAACAAAGTAACGATTATCAATCTTATGCCCAAATTGCTGCAGGAAATAGCAAAACAAACACATCACTGGAGAGAATAGAGCAACTATTAGGAAAACAGTCTGAACTTACAAATAATTTACTTAACATGATAATGTTACTTGTAAACAAATTATGCAAGTAAATCCTAACCTTGGAATATGGAAGCGTAGTAGGAGGTGACTTCAATGCTAAGCTTCCGAAGGGAAGAAACGAACTGTACAAATGCATAGTAAACAACAGCATAACAACACTTTCAACCGGCAAGCCTACATACTGGCCTACTGATAGTAGAAAGATACCAAACTTAACCCTTTCGCACCCAACGTTGCTTGTGAGCAATTTCTATGTTTTCAGAGCTAACTGTAAGTGTGCCTTTTGTTTTTATCTGCTGATTCTTTATGATAACGGTGCTTTTATGTGTCTACTCTAAATATAAAAGCAAAAAACGCATTTGGAGATTAATTGCAGGAATTATTTGCAATAAATAGCACGCGCATCACAATAATTATTGTTTCGATATTCGGTGCAACTTTTGGAATTATTAATTTACTTTTATAATACTTTAAAAAGAACCTAAAGTATAAACAGCAAAGAGTTAACAAGACAGTGATTTAGTCAAACTTAGTAAGTAGTGAACAATAAGTAAGTAAATAATTTTCTAAGTTGCTTGTGAGCAACCTTGGGCATTCGTGATAATAATTTTCACCGAAAGTGAAAGGTTTGTCTAACGAAAGAAATTGAACAGGGATTTAAACTTCGATTGGGATATTTCTACTGACGAAGAAAGTGGTGAGGAGATGAAAGACATTTCTACGGTACTGGAGAAGAATTTAGAAGGAATTCTTGAAAGGGGAGAAAGTATCGACATTGACCTTCTGGAAAATACAGTGATTGAAGGATGTGAACCTGACTCTTGCGTTGTTGTTGACAGTTGCTTAGAGAAAATTGATCCAAAGAGGCTAAAGTGGAGAACAAGGCCGTTTGTAGCTCCAGAGAGTATTTGGGAAGATGACAAAACTTTTGATGTCGGGGACATAAAGACGACCGTGGAGTTCTTCTACACACTTTTGATACTCAGCTAATTCATTTAATGGCTAGGCAAACTGATATACAGTCATGGTCAAAATTATTTTCACAAAGTGCATTTTTGTGCATGGGTCACAAACAGTTGCTTGTGCAGCAAGTGGGGGAGGTGAAATGCAAAAAAAACTTTTGCTTTTGCAAATTCAAACCTATGCAGAGTCAGATGAAAGAAGAATTGAAAAAATAACTGTTCCTATGCGCAAGGAAGAGGCAAATGAAGAGATCTTTATCAGTTGTCAGAAGTATTTGCACACGGTTTCGTCGCATCACAATTATTTTCACAACGCAATTTCTTCTTCAGTGATTGGTTTAGAGTGACAAGTGCCGGTTTGTTTGCTTAAATACATTTAAATTATTGAATAAAAAATTAGATTTAATCATTTTCCTATTACAGTTATTAAATAAAATGCCCAAAACAAAAGAGTTAACAGTTGAGGCCCGGGCTGGTATTGTTGCTAGGTTTAAAGCCGGTACACCTGCGGCCAAAATAGCTGAAATATATCAAATTTCGCGTAGAACTGTCTACTACTTAATAAAAAAAGTTTGATACAGTTGGCACATTAAAAAATAAAAAAAAGATCAGGCCGAAAACCTGTGCTGGACCAAAAGGCAATGCAGGCAAATACTTGGAGTTGTGGCGAAGAATCCTAGTGCCAGTCCGGTAAAAAATTGCCTTAGAATCAAAAAAATACAATTGGCAAACAAGTTAGTAGTTCTACAATTCGTCGCAGGCTAAAAGAAGCTGATTTTAAGACATACTTTGTTCGCAAAACGATTGAGATCACACCAACCAACAAAACAAAACGTCTTCGATTTGCGTTGGAATATGTTAAGAAGCCTCTTGACTTTTGGTTTAATATTTTATGGACTGATGAGTCTGCATTTCAGTACCAGGGGTCATACAGCAAGCATTTTATGCATTTGAAAAATAATCAAAAGCATTTGGCAGCCCAACCAACCAATAGATTTGGTGGTGGGGGCACAGTCATGTTTTGGGGATGTCTTTCCTATTATGGATTCGGAGACTTGGTACCGATAGAAGGTACTTTAAATCAGAACGGATACCTTCTTATCTTAAACAACCATGCTTTTACGTCTGGAAATAGACTTTTTCCAACTACTGAATGGATTCTTCAGCAGGACAATGCTCCATGCCATAAGGGTAGGATACCAACAAAATTTTTAAACGACCTTAATCTGGCGGTTCTTCCGTGGCCCCCCCCCAAAGCCCAGACCTTAATATCATTGAAAACGTTTGGGCTTTTATTAAAACCAACGAACTATTGATAAAAATAGAAAACGAGAGGGAGCCATCATTGAAATAGCGGAGATTTGGTCCAAATTGACATTAGAATTTGCACAAACTTTGGTAAGGTCAATACCAAAAGACTTCAAGCAGTTATTGATGCCAAAGGTGGTGTTACAAAATATTAGTATTGTATTTATATAAAATAAAGAAATTCTTATGTTGAAATTAGATGTTAAGCTGAAATTTACTAAATTAAGTTGAGTGAAAATACTTTTGAAGCGCAATAAACATGTGAAAATACTATTGACAACTTGCATGCATATTTTCTTTTGCTTTTAAGCTTTGTACTATGAACCGTTATCTTTCGTATTTCTTTTCGACTACCTTCTGCATAGATCAAGCTAAGCGATAAGAACTATTTCAGGCAAATCGGACAACAACAAGAAGAAATATAACAAAAGAAGTTGAAGTTTGCAAATATTGTGCGTTGTGAAAATACTTTGACCACCTCTGTATATAGTTTGCAGGAGCACGGTATTGAACTTAAATGTACTGATGAGGAAATCAAACGCTACATTGGCATTTTATTGTACTTTGGTGTTTTAAAACTACCGCAATTCAGAATGGCGTGGTCAAAGTATTTAAAGATTACCGCAATAACTGATTCAATGCCGCGTGGGAGATTTAAAAAAATAAAACAATGCTTACATTTCAACGACAACGCCAAACAATTAAAAAAAGGGGATTGCAACTATGATAAACTCTACAAGATCCGCCCTTTGTTCAGAATTCTCAAAGAAAATTTTGGAAAAACTAACGCAGGAAGAGCATCAAAGTGTCGATGAGCAAATAATTGCATTCAAAGGTACGTTTTAATTTTCTTTTAAATTAGCTTTATTTTTTAATAATTGCTTTTGTTGCAGGTCGATCCACGCTTAGGCAATATAATCCAAACCTCATAAATGGGGTCTTAAAATGTTTACGCGGGCTGGAATATCTGGATTAGTTTATGATTTTATTGCTATATGTTGGAGAAGGCACTTCTCCTTCTTATGGCTTGGGAATATCATCTTATGTTGTCTTATATTTGGCAGAAAGTCTTCCCAAAGACAAAATTTTAAACTGTATTTTGATAATTGGTTTACGTCTGTAATCCTTCTGATTTCGTTGAAGGAAATAGGAATCTTTGCAACAGGTACCTGTACGTATGATAAAGTTGAACATTGGGTAGTTTTTTGGAGAAAGAGGACGTTGCAGACTGTGCAAAATTGCAACACCGATGACCAAATGCCTTACATGCAAAGTCCATCTGTGCTGCAATAACAATAAAAACTGTTTTTTGTCATACCACACTTAAATTGTCATTATAAAGAAAAATATTTCATATTCTGTGATTTATAAAAAAAAAACAATGCTTACACATCACTACTGCCCGACGTTGCTCACAAGAAAACTTTTGCTACCGCCCAAACTAATGGGCGTGGCATACCTAAAATTTTGCTAAATTTTTTCTAAAATAAATGTAAAACATTAATGATAAAACAAAATTTCACGGGTAAAAAAGTTGGGCGCGAAAGGGTTAAAAGACTTCTGTAGCATACTTTGGAATCCCAGAATCTCACATGCGAATAATGGAAAGTTTTGATCTAAGCTCAGATCATTCTCTAATAATAGTGACATACAGTACAGTAGCTCATATATTGCAAATACAGATATCAATGCATTTAAAAGTTATCTGGAAACAGCTATCAGCCTGGATATCTCGCTAAAATCAGGAGAGGAGAGCTACTGTGGAGCTACTCACAAACAAGATCCATAAAGCAAGCTATATATGTACGAAGCTACCAGCCAGAAACTCACAATCAAATCAGCTCTATCTCTCAGCTGAAACTCCGACAACAAATACAACACAAGAGAAATTTGCGTAAGAGATGGCAAGAAACTCTCTACCCTGCCGACAAAAGATCGTATAACAAGGCTGCATCTGATCGCAGAAAACTACTGTCAACTTTAAGAAATTAATCTCTCGCTGAATATCTTAGAAATCTAGATCCACATTCTTGTAACCACGAACATAATTTATGGAGTAACCAAATATCTCAAGCGACCTGCAAAAGAAACACAGTAGTCCGAAACTCTAATGGCGAATGGCGTAGATCTGATGATGAACAAGCCAAAGCATTTGCTTAACACCTGCACTCTGTATTTCAGCCAAATGATATTGATAACCCGCAAACAGAAAGGGAAGTAGATAACTTTTTTCGAGTCACCGCCAAATGAGCTTACCCATTCGTAAAATCAGTATTAATGAAGTTTCATCAGAAATGGCTAAAAAGTAAAAAGGCTCCAGATTGGGACAAAATAGATGGCATAGCCTTGAAAAAAAAAATGGGCGGTTAGAGTTGACCACTTCCCAAGCCAATGGAAATGTGCAGAAATTATAGGAATCCTTAAACCAAACAAGGCAGAAAATGAAGTGACATTGTACCGTCCCATTAGTTTGTTGTCAATATTTTCTAAAGTATTTAAAAAAAATAATTTTAAAGAGAATGTTGTCAATCTTGGAAGAATTGCTATCATACCCAAACACCAGTTTGGATTCGAAGAGGCCACGGAACCCCTGAGCAATGTCACAGGATTAAAAAATGAAATTTCGTCAGCATTTGAGAGCAAAAAATACTGCACTGCTAAATTTCTTGACGTTTAACAAGCGTTTGATCGAGTCTGGCATGATGGCTTATCATATAAAACCATATTTTATATTATTAAAGTCATACTTAACCAATAGACAATTTTATTTGCAACAAAAAAATGAATACTCGCCCTTGCACTTTATAAAAGCTGGAGTCCCACAAGGAAGAGTCTTAGTAACTGTCTTATACACCCTGTAACGGCAGATATGCCGGTAACAAATACCGCCTGTAACAAATGATACAGCTATATTAGCTACAAGCTCATCTAAAGAGGAAGCCTCACAACTCCTGCAAGCAGAGCTACGCCTTATTGAAAGCTGGTTTCTTATTTGGAAAATTAAAGTCAACGCCCTGAAATCTGCGCAAATAACTTTTGCATTAAGAAGAGGTAACTGCCCAGAAGTGTCATTTAATGGATCAGCAATCCCACAAAGTATCGATCGCAGACTAACGTGGAAACACATAAACATAAAAGCAAAGCGCCAGCAACTAAATCAAAAAAGTTTGAAGATGACCTGGTTGCTTGGCCGAAAATCTGCAACCACTCGGAAAATAAAGTCCGTTTATACAAAGCTATACTAAAGCCCATGTGGACTTATGACATACAGCTTTGGGGTACTGCCAGCAACTCAAATATTGAGATTCTACAATGCTACCAATCAAAAAATATTAAGACAAATTGTTAATGCTCCATTTTATATTTCAAATGCAAGTATCTATAAAGACTTAGGAATCCCTTATGTTAAAGAAGAAATAGCAAAACATATTAAAAATATATAGACAGACCAAGAACACATGAAAATAACTTAGCCTTAAATTTGGTAAATAA
diff -r 000000000000 -r 60573349e9ae test-data/out_gfa.gfa1
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/out_gfa.gfa1 Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,2 @@
+H VN:Z:1.0
+S 0 TCACCTTTCTGCGTTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCCTCCTGTCTTTTTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTCGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGCTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAGTAGTACCTTCTTGTACAGCTCTATCGCCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACCAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGCCTGCGTGCTCACCCCCTTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCACTGCGCTGTCCATCAACCGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCCAGTTACCAGAATCAAAATTAAATTAAATTAAAAAATTTCAACGGCTTAATTTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCCCTCCCTCTCCAGATCGTCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCGCTGGCCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTGATTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAATAACAAACTTCCAAGTTTACACACTTTTGAGAGTGTCACTCTGCCCAAACCGTCATCTCTGGGATGAGCTGATAGGTCCACCTCCCCCCGTCGCGACGTTTGCCATCTGCTCTGCCATTCACCTAATAGCCACTCGTGTGCCTCTTGCCTGGAAGCGCCACTCCGCATAAGGCTGAGAGCCTTGATCTCCAGATCAATCGGCAGGCCTGCCAGCGCTAGCGCCGCGTCTTCGGATATGGTCCTGAATCCTCTAATGAGCCTGAGGGCCATTGACCGTAGCACCGAACGAGCTCCTTTCAGGTATGAGACCCTGCAAGTGGCATTGCTCCAGACTGGTGCAGCGTATAGCAGCGAAGCCTTTGCTACTGACACCAGCAGTTTCCTGGCCGGGTGTCTTGGGCCTCCGACGTTGGGCATGCCTCGCCAACGAAGAGGATGTGACTGCTGTCTTCTTGCTGGCGTAGCTCGCGTGGTCCTTGAACGATAGTCTGCGATCTATCATTACCCCCAGGTACTTTAGGGACTCTTGAGAGGTCCCCTGAGTACCCTTGACGGAGACCAGCATGTTCTCCATCTTTTCCTGCTGCTTAGTAGGACTGCTTCGGTCTTGTGAGCCGCTATTGCTAGCCCGGCTGTGATTGCCACATCGTCAGCGAAACAGCTGCCTCGACGACTTCAAGTTCTGTGACGCACGGGAAATCTGGGGCAGGGGCTGCCTCTGTTGGCCTCCATAGTGTGGTCTGCTTTGGAAATAGCTCCCCTAGTATGTTAGCCAGGACCCCCGGGTCGGATGGGGTTGCCGCTCCTCCTCCTCCTTAGCTGCTTGGTAACAAGCTTGTAGGCGAGGCCCCAGATATCGCTGTCTACGCCATCCTGCAGCTCCTTAAACGACCGCGCTTTGGCAGCCGCGATGCCGTGCTTGAACTCTAGGCGTTTGCTTCTGAAAGCCTCCAAGAGTTCCGCGTGGTGGAGTACTGCCTCTGGCTCGTTGCGCCGTTCTCTTAGCCCTGAGGCAATCAGACCGTAGTTGGCTTAGGGAGGCACTCCACCAGTAAACGGGTGGTTTGCGCTGTGCCTTATTTTTTCCTTGGCATGATTGCGTCGCAGATTCTTCCCAGCATATTCATGAGGCCTGCCGCCATACTCTCTGCGTCCACATTTGGGATTTCCAGGGGAATTGATCTGATAGGCCAGCATGGCCTCATCGATCTTCCTGGTGTCCCATGTTTTCCCGGCTGTTCTACTCTGCCGTCTTTTGGGCATGTCCCTCCGGGGAGAAGGAGATCAGGGCATGGTCGCTCAGCGTCATGACGTCATGGACCATCCAGTTGTTGTTGTCTACTAGCCCTCTGCTGACAAAGGTAACGTCAATAAAGGACGTACCCCTATCGTTGTTAAACGTCGGCTTCCGTCCATCGTTCAGCAGTATGAGGTCCAGCATTCGCATGGCGTCAATCACAGCTCGTCCTCTGGTGTTGGATGTCCTGCTGCCCCATTCCACTGTCCAGGCATTAAAGTCGCCGGTATGACCTTCGGGCTTGCCCTCTCGCATGGTCCACGAGCGCCTCCAGAAGCCCTCGAACTGATCGGGGGTGTCGCTCGGCGGAGCGTAGCAGCTGTACATGTGCACGTGTTTTAACTTCGCATAAGCGATACCCCGCATGGGTAAAGCAGCCAGTTCCTGGACTTGAGAGAGCTGCAGCATTTGATAGCTGCTTTTACCTGCCTCGTCAAGGATCATGGACGATTGTCCACTACCAGAGACGTAGGGTTCGCTTAGGAGCATGATGTCTACATTGCGCTCAACCGCAGTCTGGGCCAGGAGGCTCTGAGCTGCTGCGCAATGATTGACATTGAGCTGTACTACGCTAATATGAGCGTGCATTAAGGTGGCTCTTGGCATCTTTTAGTGTCGCTCTGTAAGTCGGGCACGCAAAGCTACCCGTCGGGTGGTTTCTGTCCACCTCGCTGCTGCAGATCAGGCATTTTGGTGCAGCAACGCACCCCTTTGCCTTGTGCCCACGCTCACCGCATCTAAGACAGCAGTCTGCCCTGTCAGTGTCCTTGCAGGTTGCTGATCGATGCCCATAGCCGAGACACCTGTAGCATCTCGTGGGTCGGACGTCCTGGGTGATACGACATCTTGACCATCCAACGATTATGGTGCCCTGTTTAAGGACTGGTATCGCAACGTTCGCGTTCAGCAGCACTGAGGCTATTTGCTTTGCAATTCCGCATACTGCGAAGGCCCCTGATATCTTCAGGATTTATCTGCAGGCCCTGGAATTGGGCGACCAAGCAGCTGTGGAGCTTCTCTGCTGTCGTAGCCTCGTCCAATCCGCTGCAAGATAGAGCTATTCTTTGCGCTCCCTGTGCGCACAGAGGTTAAGTCATTGAGCGCCGCTTCCAGGTCGCTCTTAAACTTGGGAACGCTTTCGAAGCTTTCCCCTCTACCTCAAGCAACAGATCACCTTTCTGCGTTCTCTCCGGATTTTTTCGCACGTGACTGCCCAGTTCGCTAAGGCTCGATTCCGATCTTAGCTTCCGAAGCATCTCTGCGTACGAAGCCTCTCCTGTCTTTTTACGATGAGTGCCTCTGCACCCGTGCTAGCATTCTTGGCGACAGATGCATAGCTGCCTGGCTTGGACTCGTTAGGTATGGATGTCGCCTTTTCTTCACCGTTGCCATCCAACGTAGGGTTGCTCTGCTTCGGCGCCTGGACTTTGGCACCTGCACCGTGGGTACCTGCGCATTTTGTGGAGCCTTTTGGTAGGCTTTTGTACCTCCGTCTGGGTAGCGCTGCTCTTCAAGCGGTGCTCGCTAAGTAGTACCTTCGTACAGCTCTATCGCCCTGTTGTTAAGGGCTGAGAGTTCGGAAGCTATGCCCTTTGTCTCATGTGTGTCGTTGGGTCTCGAATGCGGATAGAAGGGGGCTGATCTTGCCATTCATCCTGGTAAGTATGCCCCTCAGGTCTCGTTCTGGAGAGCAGTGGTCAAGTCCGAAGACCGATGAGGGGAACAAGCTGGGGACTTCCCTCCCGTCTTTTGCGATGGCACGGCGATGTGGTCCATCGTCTTCTGACTTGTCGCGGTCGTAGATGCTGTAGGAGCCAATTTCTCCACCTCTACAGCATCGCTGCAGTCGATAGTCAACGGCGGCTGGGGGCCTGCGTGCTCACCCCTTGCCACCGACGGGACCGAGATTCCGTCACCATGGGTCGGGTTACCGACTCCTCTGGTGGGGGGATCTCGAAAGTCGGGAGCTCCTCCTGAACGGGTCGTTGCGATCAGGGGACTGCCCCCCACTGCGCTGTCCATCAACTGAAGGATGGCCTAAGGTTACCTAGGGTCACGTAGGCCACGGATTTCCCCCTGGCTTTTACGGATGGAGGTTTGTACCGCCTCGACTCGGACACCAGAGCCTCTGCTTAGGCACCAGCACGGTGAGAGGATGATATTTGGTCTGTCCGCGACCTTTGTGCCTTTTCCCCTTTCTTAAAGACTTGTGCGCTCCCAGTTACCAGAATCAAAATTAAATTAAATTAAATTTCAACGGCTTAATTTTAAATTTAATTTTGAATTTCGCGCCCTACTGTCGCAACACAACACTGATCACACGGTTGATCTGGCAACGCCTCCCTCTCCAGATCGCCCGCTGCGCTATCAGCTGTTTATCCGCTGCAACAATCGCAAGATAATAAATTACCTATTTACATGAAACAGGCGCACAATTAACTCGCGTGATTGCAGCGCAGAACTATGGCGCGACTCCACCGTGTGATTTTGCCAGTTTGCCGCACACACCGGCCGACACAACTTCTATGGTTTCGAGTATTTCGCGCCGCGTAATTTAAGACGTCCGTCTTCACGGCGATGTAGACTTGGTCTCCGCACCAGGATTGAGTGTCTAAGCCTGTGCGTTCAGGATTAAACTTTGGCAATACGACAGCATTGAGTTTTTTGGGTCTCTTTGTGAGTTTTGCACTTCTTTTAACAGTTCAGAAAAATGGCGATTCTGCGACTCTAGAATTGTCAGCAAATTGTTTTCACTATTGTAGTATGCACACATATCGGTTAAGCACTGTACCTATGTGTATTCATAATTGTAGCACTCTGTTGCAATGTGTACATAAACAGTCCAGCACAAGTGTATACGTAATACGAGCACCCACTTGAGGGCTAACATACATAATTGCCTGGTCAGCAGTTCTCCCTGCTGGCAAGCGCTGATCGCTTATATGTGTGCCTATACCACTCCTCCTCCAGCACCATCGCTCGGCGACAGTACATATATATATACATATATATAAGATACGCATATAAGCGTTGCTGCGCTGCAGGCTATGCCGGCAGCGCTGCTCCTCGACTTAGGCTAAGAAACCTTTGTATGTAGATCATAAGAGGATTGACGAATTAATTTCGAATGGAGCGGGACCTTCCCTGTTCCTCAAATTGGATCAAATAAAGAACAGCTAAAACACAAATGATCTATGACACAATGAAACTACAGGAAGTTGGAGTAGGCGGTCCCACTTCTGATGTCGGATCTGAATCACTTTATACTCGGCATCACTCTCTACAGCGGACACAAAGTAACAGAAAACGGTCGTTAACTTGAAATTAAAATAAATCTGCGACAAGTACAGTTTGTCAAGAAACTGTTTACACACCGTGAAATAAGATGAATTTTTTGATTTTTAACGGTCAAAATTAAGGGTTATTTGCTTAATTAAACGCAATTTTTTTTTAGGAAATATAATTAAACAATATTTATTTTACTTATAAATTAAAAAACAAATTCAAAATATCAAATATACAAGAAAATAAACAACGAATTCCAAGTTTAAAGCACTTTTGAGAGTTTCAAGAAACTCTTTACACAAAAACACTAAACCTAAGTTTAATCCTAAATTTTTAAATTATTTTGTTAAAATTTGAAAAGTTGTAGTATTTAGTATGACCCCCCATTGGCTTTGGCTACAAGTTGAAGCTTTTTTTTCATGGAATGGATGAGTTTTTTTTAGGTCATATTCAAGCGGGATCTTTTCCCACTCTATCGCAGCCATGAGCTGTTGTCGTGTTTTGGTGCCCCTTTTGCCACATTCTTCTTTAAGTAGGCCCACAAATTTTCAATGGGGTTCAGATCAAGACTCTGAGGGGGCGTATCGATCACCTTGCCACAGTTATAAAGGAGCCAGTTGCGTACATTGCACTCTTTATGTTTTGGGATCATTGTCCTGATAAAACTTAAAATTTGGCTTGTTGTTGCTAAATAGACCAAATTTTTTCTGCACTGGCCTTCAAATTTGATTTTAAAATATCTAGATATTGCACGGCATTCATAGTGCTTTCAATAAAGGCTAATTTGCCCACTCCATGGCTTGAGATACAGCCCCAAATCATCACTGATAATTTTCCAAATTTGATTGTTGGAATGATATTTTGTTTTTTCTAGCGCACTCAACAGCTTGCGCCATACTCTGCTTGGCCCATCGTTATAATAGAGCATCATTTTTGTTTCGTCACAAAATATTACGTCATCCCAGTACTCTTCCGCATGATCCATCATGCTCACAGCGAATGAATGACGCTTTTCTATATTGACCTCTGATAGCAAAGGCTTTTTTTCTTGCAACTCTTGAAGAGTACCTATGGCGTAGAATGACTTGGCGCACAGTTTTGTGTGGCACAACTAGGTCACATTCTTGCCTGATATCCTGAGCAAGTGATCTGACCGAGATTCAGGGGGGTTCGCAATCACTTTTCGCATAATAAGGCGGTCTACACGCTTGCTAATTTTAGTTTTGCGCCCACCACTCTTAGGTTCAAGCCTGTTCTCTTTTTTCAAGCGATTAAAACATTGTAGACGGTCTTACGGGATACAGAAAACATTTATACTAATTCTGGAATAGATTTTCCCAACTGGTGGTTTTAGTATATTATTTGGGTCACTTCAAAAGCTAATCTATTTCCAGGCATTTTTATTAAATTTAATAACTCATTCGATCAGCAAAATTTCACAAGCAAAGTAAAAAAAATTTCAATAGAAGCGTTGTAAAAAGGAATGCAAATGCCAAAAATAACGGAAAAATCGAGTTCGTTCTAAGAAAAGAGCAAAACAAAGTAGGAAAACAAAATGTGTAAGGAGTTTCTTGCCACTCTCAAAAGTGTGTAAACTTGGAATTTGTTGTTTAATTTCTTGTATATTTGATATTTTGAATTTGTTTTTTTAATTTATAAGTAAAATAAATATTGTTTAATTATATTTCATTAAAAAATTGCGTTTAATTAAAGAAATAACCCTTAATTTTGATTTAAACCTTTAAAATGAAAAATTCAACTTATTTCACGGCGTGTAAATAGTTTCTTGACAAACTGTATATATCTACAAATTTACAACTTGCCGGTACCATCTGCAAGATTCATTACATTGAGAAGTGGACTTTGACTCTCAGAATGAATTAAAACATTATATTCTTAGATTGAACTGACGAGGAACCAGACTGAACTAACTAAACTAACTATCATTTAACTAAATTTAATTGTTTGCTGATAATTTTGAGTTTCTTACAAAGATGACTAATATTAATTTTTAGTTAAAATAGTTTGCAAAACTGAATTTATGTAAATAATATGTTCAATTGATCTGGTTGGGTTTTCTGGGTCTCCCCAACACCTCGCAACGAATGCTGGATCAAAATTATTCGTCAGAAGGACGTGCACAGTCTCGTGAGTAATAAAAGTACAGCAATCTTACTTTGAGGTGGCGTGTTGGAAAGTATGTACACATTTAAGCAAAAGTCACATGGCCTGCATCAAAGACACTAGAATAATAAGATGCGTAACAGCCATACACTGGTTTGGCACTATGCAGCCACTTTTTTTTGGTGACGGCCAAAATTGCTCTCTTTCCGCTCGCTCACGCTGAGCGTAAGAAATCTAAAATAGAATTTGCTTGCTTGTGTGAGTAAAAACAAAAGACGAGAACGCGTATATGTGTGCGTGTTGTGCTAGAAGGCGATTTTCGGGCCGAAATCAATTCTGATCGCAGTAACGAATTTACATATGTACATACATATTTGGGGAGTTTTGGCCAATTTCGTAGAATATGATGAAATTGCGCGCTGTTTAAGATATCAAATTGGAATATAAAAAAAACTGAAAAGAAGTCATTACACTGAGAAAAAATATTTCATAAAAAAATAATACGAAGTAGAAAATAAAAATTTATAAAATAAAAAAAAATGTTAACTGTTTATTGCAAACGTCATATCAAATTAGAATTATTCTAGTGTCTTTGCTTTGGTCATATCTTGAGGCACGAAGTGCGGACCAAAGCACTCAACAATCATTGTCTTCTTAATACTCAAGCAGAGCGACACCGACGAAGACCCTAACTGCTTTGAAATGGCGAAGTAAAATAAAATCAAAAAAAGAGACCAAGCCCCTCCCGAAGTTCAAAGAAAACAGGATTCCCTGGACAATTCATCAAGCACCAGCGCAAATAATTTCGCTCTCTTAAGCGACGGATTGCCCGACAAAACAGGAAACAAATATAACAAAACGAAGATCTCGAAATGGTAAAGTGAAGACAGTGCAACTGATTTTGCTAAGCCCCACCTATCTTTCTCTCTGACGTCAATGGTATAAGTGAAAAGCTAACCTATCTTAAAACTAAAATTAAGAGAACTTTTTTTTATTATAAGACTCAACGTTATGGACATGTAGAGGTAATGGTTAAAAGTATTGAAGAATTCTGAAAATTAGTCAAAACACTTAATAATGATTGTGTGCAGTACCACACATACCAGCTTAAGGATGACAGAGCATTTAGAGTTGTTATTAAGAATTTGCATTTTCCACAAATTTAGATGAAATTAAAAGTGATGAAGAGTCAAAAGGTCATGTTGTTAGAAACATAAGTAATATTAAAAAGCCGTGCGACCAAAACGTCACTGAACATGTTTTATGTAGATATTGAGCCTAACAAAAAAAACCTAGACATATATAATGTAAATAAAATATTGAGCCTCCCCACAATGAAATCGTTCAATGCTATAGCTGCCAGGAATTCGGACATACTAAATCATATTGTACCAAAACGTACCGCTGTGTAAAATCCTCTTCTCGACACCCAAGCAACATTTGCCCGAAAAATACAGAACAACCAGCAAAATGTGCCAACTGCTACGAAGAACACGCCGCCAGCTACAAAGGGTGTAGAATTTATCAGGAACTCTTGTCCAAAAAAAAATAGAAAATAGAAATAATGATCTGAGTAAAATGATTTAGGAATCCAGCAAAGTTTGTTCCGCCTAACAAGCCAACATATACCCAACAAAGTAACGATTATCAATCTTATGCCCAAATTGCTGCAGGAAATAGCAAAACAAACACATCACTGGAGAGAATAGAGCAACTATTAGGAAAACAGTCTGAACTTACAAATAATTTACTTAACATGATAATGTTACTTGTAAACAAATTATGCAAGTAAATCCTAACCTTGGAATATGGAAGCGTAGTAGGAGGTGACTTCAATGCTAAGCTTCCGAAGGGAAGAAACGAACTGTACAAATGCATAGTAAACAACAGCATAACAACACTTTCAACCGGCAAGCCTACATACTGGCCTACTGATAGTAGAAAGATACCAAACTTAACCCTTTCGCACCCAACGTTGCTTGTGAGCAATTTCTATGTTTTCAGAGCTAACTGTAAGTGTGCCTTTTGTTTTTATCTGCTGATTCTTTATGATAACGGTGCTTTTATGTGTCTACTCTAAATATAAAAGCAAAAAACGCATTTGGAGATTAATTGCAGGAATTATTTGCAATAAATAGCACGCGCATCACAATAATTATTGTTTCGATATTCGGTGCAACTTTTGGAATTATTAATTTACTTTTATAATACTTTAAAAAGAACCTAAAGTATAAACAGCAAAGAGTTAACAAGACAGTGATTTAGTCAAACTTAGTAAGTAGTGAACAATAAGTAAGTAAATAATTTTCTAAGTTGCTTGTGAGCAACCTTGGGCATTCGTGATAATAATTTTCACCGAAAGTGAAAGGTTTGTCTAACGAAAGAAATTGAACAGGGATTTAAACTTCGATTGGGATATTTCTACTGACGAAGAAAGTGGTGAGGAGATGAAAGACATTTCTACGGTACTGGAGAAGAATTTAGAAGGAATTCTTGAAAGGGGAGAAAGTATCGACATTGACCTTCTGGAAAATACAGTGATTGAAGGATGTGAACCTGACTCTTGCGTTGTTGTTGACAGTTGCTTAGAGAAAATTGATCCAAAGAGGCTAAAGTGGAGAACAAGGCCGTTTGTAGCTCCAGAGAGTATTTGGGAAGATGACAAAACTTTTGATGTCGGGGACATAAAGACGACCGTGGAGTTCTTCTACACACTTTTGATACTCAGCTAATTCATTTAATGGCTAGGCAAACTGATATACAGTCATGGTCAAAATTATTTTCACAAAGTGCATTTTTGTGCATGGGTCACAAACAGTTGCTTGTGCAGCAAGTGGGGGAGGTGAAATGCAAAAAAAACTTTTGCTTTTGCAAATTCAAACCTATGCAGAGTCAGATGAAAGAAGAATTGAAAAAATAACTGTTCCTATGCGCAAGGAAGAGGCAAATGAAGAGATCTTTATCAGTTGTCAGAAGTATTTGCACACGGTTTCGTCGCATCACAATTATTTTCACAACGCAATTTCTTCTTCAGTGATTGGTTTAGAGTGACAAGTGCCGGTTTGTTTGCTTAAATACATTTAAATTATTGAATAAAAAATTAGATTTAATCATTTTCCTATTACAGTTATTAAATAAAATGCCCAAAACAAAAGAGTTAACAGTTGAGGCCCGGGCTGGTATTGTTGCTAGGTTTAAAGCCGGTACACCTGCGGCCAAAATAGCTGAAATATATCAAATTTCGCGTAGAACTGTCTACTACTTAATAAAAAAAGTTTGATACAGTTGGCACATTAAAAAATAAAAAAAAGATCAGGCCGAAAACCTGTGCTGGACCAAAAGGCAATGCAGGCAAATACTTGGAGTTGTGGCGAAGAATCCTAGTGCCAGTCCGGTAAAAAATTGCCTTAGAATCAAAAAAATACAATTGGCAAACAAGTTAGTAGTTCTACAATTCGTCGCAGGCTAAAAGAAGCTGATTTTAAGACATACTTTGTTCGCAAAACGATTGAGATCACACCAACCAACAAAACAAAACGTCTTCGATTTGCGTTGGAATATGTTAAGAAGCCTCTTGACTTTTGGTTTAATATTTTATGGACTGATGAGTCTGCATTTCAGTACCAGGGGTCATACAGCAAGCATTTTATGCATTTGAAAAATAATCAAAAGCATTTGGCAGCCCAACCAACCAATAGATTTGGTGGTGGGGGCACAGTCATGTTTTGGGGATGTCTTTCCTATTATGGATTCGGAGACTTGGTACCGATAGAAGGTACTTTAAATCAGAACGGATACCTTCTTATCTTAAACAACCATGCTTTTACGTCTGGAAATAGACTTTTTCCAACTACTGAATGGATTCTTCAGCAGGACAATGCTCCATGCCATAAGGGTAGGATACCAACAAAATTTTTAAACGACCTTAATCTGGCGGTTCTTCCGTGGCCCCCCCCCAAAGCCCAGACCTTAATATCATTGAAAACGTTTGGGCTTTTATTAAAACCAACGAACTATTGATAAAAATAGAAAACGAGAGGGAGCCATCATTGAAATAGCGGAGATTTGGTCCAAATTGACATTAGAATTTGCACAAACTTTGGTAAGGTCAATACCAAAAGACTTCAAGCAGTTATTGATGCCAAAGGTGGTGTTACAAAATATTAGTATTGTATTTATATAAAATAAAGAAATTCTTATGTTGAAATTAGATGTTAAGCTGAAATTTACTAAATTAAGTTGAGTGAAAATACTTTTGAAGCGCAATAAACATGTGAAAATACTATTGACAACTTGCATGCATATTTTCTTTTGCTTTTAAGCTTTGTACTATGAACCGTTATCTTTCGTATTTCTTTTCGACTACCTTCTGCATAGATCAAGCTAAGCGATAAGAACTATTTCAGGCAAATCGGACAACAACAAGAAGAAATATAACAAAAGAAGTTGAAGTTTGCAAATATTGTGCGTTGTGAAAATACTTTGACCACCTCTGTATATAGTTTGCAGGAGCACGGTATTGAACTTAAATGTACTGATGAGGAAATCAAACGCTACATTGGCATTTTATTGTACTTTGGTGTTTTAAAACTACCGCAATTCAGAATGGCGTGGTCAAAGTATTTAAAGATTACCGCAATAACTGATTCAATGCCGCGTGGGAGATTTAAAAAAATAAAACAATGCTTACATTTCAACGACAACGCCAAACAATTAAAAAAAGGGGATTGCAACTATGATAAACTCTACAAGATCCGCCCTTTGTTCAGAATTCTCAAAGAAAATTTTGGAAAAACTAACGCAGGAAGAGCATCAAAGTGTCGATGAGCAAATAATTGCATTCAAAGGTACGTTTTAATTTTCTTTTAAATTAGCTTTATTTTTTAATAATTGCTTTTGTTGCAGGTCGATCCACGCTTAGGCAATATAATCCAAACCTCATAAATGGGGTCTTAAAATGTTTACGCGGGCTGGAATATCTGGATTAGTTTATGATTTTATTGCTATATGTTGGAGAAGGCACTTCTCCTTCTTATGGCTTGGGAATATCATCTTATGTTGTCTTATATTTGGCAGAAAGTCTTCCCAAAGACAAAATTTTAAACTGTATTTTGATAATTGGTTTACGTCTGTAATCCTTCTGATTTCGTTGAAGGAAATAGGAATCTTTGCAACAGGTACCTGTACGTATGATAAAGTTGAACATTGGGTAGTTTTTTGGAGAAAGAGGACGTTGCAGACTGTGCAAAATTGCAACACCGATGACCAAATGCCTTACATGCAAAGTCCATCTGTGCTGCAATAACAATAAAAACTGTTTTTTGTCATACCACACTTAAATTGTCATTATAAAGAAAAATATTTCATATTCTGTGATTTATAAAAAAAAAACAATGCTTACACATCACTACTGCCCGACGTTGCTCACAAGAAAACTTTTGCTACCGCCCAAACTAATGGGCGTGGCATACCTAAAATTTTGCTAAATTTTTTCTAAAATAAATGTAAAACATTAATGATAAAACAAAATTTCACGGGTAAAAAAGTTGGGCGCGAAAGGGTTAAAAGACTTCTGTAGCATACTTTGGAATCCCAGAATCTCACATGCGAATAATGGAAAGTTTTGATCTAAGCTCAGATCATTCTCTAATAATAGTGACATACAGTACAGTAGCTCATATATTGCAAATACAGATATCAATGCATTTAAAAGTTATCTGGAAACAGCTATCAGCCTGGATATCTCGCTAAAATCAGGAGAGGAGAGCTACTGTGGAGCTACTCACAAACAAGATCCATAAAGCAAGCTATATATGTACGAAGCTACCAGCCAGAAACTCACAATCAAATCAGCTCTATCTCTCAGCTGAAACTCCGACAACAAATACAACACAAGAGAAATTTGCGTAAGAGATGGCAAGAAACTCTCTACCCTGCCGACAAAAGATCGTATAACAAGGCTGCATCTGATCGCAGAAAACTACTGTCAACTTTAAGAAATTAATCTCTCGCTGAATATCTTAGAAATCTAGATCCACATTCTTGTAACCACGAACATAATTTATGGAGTAACCAAATATCTCAAGCGACCTGCAAAAGAAACACAGTAGTCCGAAACTCTAATGGCGAATGGCGTAGATCTGATGATGAACAAGCCAAAGCATTTGCTTAACACCTGCACTCTGTATTTCAGCCAAATGATATTGATAACCCGCAAACAGAAAGGGAAGTAGATAACTTTTTTCGAGTCACCGCCAAATGAGCTTACCCATTCGTAAAATCAGTATTAATGAAGTTTCATCAGAAATGGCTAAAAAGTAAAAAGGCTCCAGATTGGGACAAAATAGATGGCATAGCCTTGAAAAAAAAAATGGGCGGTTAGAGTTGACCACTTCCCAAGCCAATGGAAATGTGCAGAAATTATAGGAATCCTTAAACCAAACAAGGCAGAAAATGAAGTGACATTGTACCGTCCCATTAGTTTGTTGTCAATATTTTCTAAAGTATTTAAAAAAAATAATTTTAAAGAGAATGTTGTCAATCTTGGAAGAATTGCTATCATACCCAAACACCAGTTTGGATTCGAAGAGGCCACGGAACCCCTGAGCAATGTCACAGGATTAAAAAATGAAATTTCGTCAGCATTTGAGAGCAAAAAATACTGCACTGCTAAATTTCTTGACGTTTAACAAGCGTTTGATCGAGTCTGGCATGATGGCTTATCATATAAAACCATATTTTATATTATTAAAGTCATACTTAACCAATAGACAATTTTATTTGCAACAAAAAAATGAATACTCGCCCTTGCACTTTATAAAAGCTGGAGTCCCACAAGGAAGAGTCTTAGTAACTGTCTTATACACCCTGTAACGGCAGATATGCCGGTAACAAATACCGCCTGTAACAAATGATACAGCTATATTAGCTACAAGCTCATCTAAAGAGGAAGCCTCACAACTCCTGCAAGCAGAGCTACGCCTTATTGAAAGCTGGTTTCTTATTTGGAAAATTAAAGTCAACGCCCTGAAATCTGCGCAAATAACTTTTGCATTAAGAAGAGGTAACTGCCCAGAAGTGTCATTTAATGGATCAGCAATCCCACAAAGTATCGATCGCAGACTAACGTGGAAACACATAAACATAAAAGCAAAGCGCCAGCAACTAAATCAAAAAAGTTTGAAGATGACCTGGTTGCTTGGCCGAAAATCTGCAACCACTCGGAAAATAAAGTCCGTTTATACAAAGCTATACTAAAGCCCATGTGGACTTATGACATACAGCTTTGGGGTACTGCCAGCAACTCAAATATTGAGATTCTACAATGCTACCAATCAAAAAATATTAAGACAAATTGTTAATGCTCCATTTTATATTTCAAATGCAAGTATCTATAAAGACTTAGGAATCCCTTATGTTAAAGAAGAAATAGCAAAACATATTAAAAATATATAGACAGACCAAGAACACATGAAAATAACTTAGCCTTAAATTTGGTAAATAA RC:i:105426
diff -r 000000000000 -r 60573349e9ae test-data/out_reads.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/out_reads.csv Wed Nov 11 21:54:51 2020 +0000
@@ -0,0 +1,59 @@
+AssembledSegmentId,EdgeCount,OrientedReadCount,OrientedReadId,VertexCount,EdgeCount
+0,478,29,1-0,138,109
+0,478,29,2-1,137,115
+0,478,29,3-1,85,69
+0,478,29,6-1,146,114
+0,478,29,8-1,161,130
+0,478,29,9-1,167,141
+0,478,29,10-1,223,196
+0,478,29,11-0,231,188
+0,478,29,13-0,292,229
+0,478,29,15-1,274,246
+0,478,29,16-1,262,213
+0,478,29,17-1,305,255
+0,478,29,19-0,139,103
+0,478,29,22-0,232,172
+0,478,29,23-0,360,330
+0,478,29,24-1,282,233
+0,478,29,26-0,346,301
+0,478,29,27-0,147,100
+0,478,29,28-0,245,230
+0,478,29,29-0,220,198
+0,478,29,30-1,179,149
+0,478,29,31-0,166,140
+0,478,29,33-1,140,126
+0,478,29,36-1,105,91
+0,478,29,38-0,90,82
+0,478,29,39-1,68,62
+0,478,29,40-1,85,76
+0,478,29,41-1,87,81
+0,478,29,42-1,77,69
+1,478,29,1-1,138,109
+1,478,29,2-0,137,115
+1,478,29,3-0,85,69
+1,478,29,6-0,146,114
+1,478,29,8-0,161,130
+1,478,29,9-0,167,141
+1,478,29,10-0,223,196
+1,478,29,11-1,231,188
+1,478,29,13-1,292,229
+1,478,29,15-0,274,246
+1,478,29,16-0,262,213
+1,478,29,17-0,305,255
+1,478,29,19-1,139,103
+1,478,29,22-1,232,172
+1,478,29,23-1,360,330
+1,478,29,24-0,282,233
+1,478,29,26-1,346,301
+1,478,29,27-1,147,100
+1,478,29,28-1,245,230
+1,478,29,29-1,220,198
+1,478,29,30-0,179,149
+1,478,29,31-1,166,140
+1,478,29,33-0,140,126
+1,478,29,36-0,105,91
+1,478,29,38-1,90,82
+1,478,29,39-0,68,62
+1,478,29,40-0,85,76
+1,478,29,41-0,87,81
+1,478,29,42-0,77,69