# HG changeset patch # User iuc # Date 1665560639 0 # Node ID 179342c7b86c7b5694305c35fbfb54d4c7860d25 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/medaka commit 4d3dfd4bcb567178107dcfd808ff03f9fec0bdbd diff -r 000000000000 -r 179342c7b86c all_fasta.loc.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/all_fasta.loc.sample Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,18 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +# +# +#So, all_fasta.loc could look something like this: +# +#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa +#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa +#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa +# +#Your all_fasta.loc file should contain an entry for each individual +#fasta file. So there will be multiple fasta files for each build, +#such as with hg19 above. +# diff -r 000000000000 -r 179342c7b86c convert_VCF_info_fields.py --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/convert_VCF_info_fields.py Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,164 @@ +#!/usr/bin/env python3 + +# Takes in VCF file annotated with medaka tools annotate and converts +# +# Usage statement: +# python convert_VCF_info_fields.py in_vcf.vcf out_vcf.vcf + +# 10/21/2020 - Nathan P. Roach, natproach@gmail.com + +import re +import sys +from collections import OrderedDict +from math import log10 + +import scipy.stats + + +def pval_to_phredqual(pval): + try: + ret = round(-10 * log10(pval)) + except ValueError: + ret = 2147483647 # transform pval of 0.0 to max signed 32 bit int + return ret + + +def parseInfoField(info): + info_fields = info.split(";") + info_dict = OrderedDict() + for info_field in info_fields: + code, val = info_field.split("=") + info_dict[code] = val + return info_dict + + +def annotateVCF(in_vcf_filepath, out_vcf_filepath): + """Postprocess output of medaka tools annotate. + + Splits multiallelic sites into separate records. + Replaces medaka INFO fields that might represent information of the ref + and multiple alternate alleles with simple ref, alt allele counterparts. + """ + + in_vcf = open(in_vcf_filepath, "r") + # medaka INFO fields that do not make sense after splitting of + # multi-allelic records + # DP will be overwritten with the value of DPSP because medaka tools + # annotate currently only calculates the latter correctly + # (https://github.com/nanoporetech/medaka/issues/192). + # DPS, which is as unreliable as DP, gets skipped and the code + # calculates the spanning reads equivalent DPSPS instead. + to_skip = {"SC", "SR", "AR", "DP", "DPSP", "DPS"} + struct_meta_pat = re.compile("##(.+)=") + header_lines = [] + contig_ids = set() + contig_ids_simple = set() + # parse the metadata lines of the input VCF and drop: + # - duplicate lines + # - INFO lines declaring keys we are not going to write + # - redundant contig information + while True: + line = in_vcf.readline() + if line[:2] != "##": + assert line.startswith("#CHROM") + break + if line in header_lines: + # the annotate tool may generate lines already written by + # medaka variant again (example: medaka version line) + continue + match = struct_meta_pat.match(line) + if match: + match_type, match_id, match_misc = match.groups() + if match_type == "INFO": + if match_id == "DPSP": + line = line.replace("DPSP", "DP") + elif match_id in to_skip: + continue + elif match_type == "contig": + contig_ids.add(match_id) + if not match_misc: + # the annotate tools writes its own contig info, + # which is redundant with contig info generated by + # medaka variant, but lacks a length value. + # We don't need the incomplete line. + contig_ids_simple.add(match_id) + continue + header_lines.append(line) + # Lets check the above assumption about each ID-only contig line + # having a more complete counterpart. + assert not (contig_ids_simple - contig_ids) + header_lines.insert(1, "##convert_VCF_info_fields=0.2\n") + header_lines += [ + '##INFO=\n', + '##INFO=\n', + '##INFO=\n', + '##INFO=\n', + '##INFO=\n', + '##INFO=\n', + '##INFO=\n', + line, + ] + + with open(out_vcf_filepath, "w") as out_vcf: + out_vcf.writelines(header_lines) + for line in in_vcf: + fields = line.split("\t") + info_dict = parseInfoField(fields[7]) + sr_list = [int(x) for x in info_dict["SR"].split(",")] + sc_list = [int(x) for x in info_dict["SC"].split(",")] + if len(sr_list) != len(sc_list): + print("WARNING - SR and SC are different lengths, " "skipping variant") + print(line.strip()) # Print the line for debugging purposes + continue + variant_list = fields[4].split(",") + dpsp = int(info_dict["DPSP"]) + ref_fwd, ref_rev = 0, 1 + dpspf, dpspr = (int(x) for x in info_dict["AR"].split(",")) + for i in range(0, len(sr_list), 2): + dpspf += sr_list[i] + dpspr += sr_list[i + 1] + for j, i in enumerate(range(2, len(sr_list), 2)): + dp4 = (sr_list[ref_fwd], sr_list[ref_rev], sr_list[i], sr_list[i + 1]) + dp2x2 = [[dp4[0], dp4[1]], [dp4[2], dp4[3]]] + _, p_val = scipy.stats.fisher_exact(dp2x2) + sb = pval_to_phredqual(p_val) + + as_ = (sc_list[ref_fwd], sc_list[ref_rev], sc_list[i], sc_list[i + 1]) + + info = [] + for code in info_dict: + if code in to_skip: + continue + val = info_dict[code] + info.append("%s=%s" % (code, val)) + + info.append("DP=%d" % dpsp) + info.append("DPSPS=%d,%d" % (dpspf, dpspr)) + + if dpsp == 0: + info.append("AF=NaN") + else: + af = (dp4[2] + dp4[3]) / dpsp + info.append("AF=%.6f" % af) + if dpspf == 0: + info.append("FAF=NaN") + else: + faf = dp4[2] / dpspf + info.append("FAF=%.6f" % faf) + if dpspr == 0: + info.append("RAF=NaN") + else: + raf = dp4[3] / dpspr + info.append("RAF=%.6f" % raf) + info.append("SB=%d" % sb) + info.append("DP4=%d,%d,%d,%d" % dp4) + info.append("AS=%d,%d,%d,%d" % as_) + new_info = ";".join(info) + fields[4] = variant_list[j] + fields[7] = new_info + out_vcf.write("\t".join(fields)) + in_vcf.close() + + +if __name__ == "__main__": + annotateVCF(sys.argv[1], sys.argv[2]) diff -r 000000000000 -r 179342c7b86c macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,188 @@ + + 1.7.2 + 0 + 21.01 + + + medaka + + + + + medaka + + + + + medaka --version + + + + @online{medaka, + author = {Oxford Nanopore Technologies Ltd.}, + title = {medaka}, + year = 2020, + url = {https://github.com/nanoporetech/medaka}, + urldate = {2020-05-06} + } + + + + + + reference.fa && + #else + ln -f -s '$reference_source.ref_file' reference.fa && + #end if + #else: + ln -f -s '$reference_source.ref_file.fields.path' reference.fa && + #end if + ]]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + `_ and `github `_. + ]]> + diff -r 000000000000 -r 179342c7b86c snp.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/snp.xml Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,169 @@ + + decodes probabilities to SNPs + + macros.xml + + + + &1 | tee '$out_log' +#else + raw.vcf ##output of medaka snp + 2>&1 | tee '$out_log' + && ln -s '$output_annotated.in_bam' in.bam + && ln -s '$output_annotated.in_bam.metadata.bam_index' in.bai + && medaka tools annotate --dpsp --pad $output_annotated.pad raw.vcf reference.fa in.bam tmp.vcf + && python '$__tool_directory__/convert_VCF_info_fields.py' tmp.vcf '$out_SNPs' +#end if + ]]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + output_log_bool + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 179342c7b86c test-data/alignment.bam Binary file test-data/alignment.bam has changed diff -r 000000000000 -r 179342c7b86c test-data/all_fasta.loc --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/all_fasta.loc Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,1 @@ +ref_fasta ref_fasta ref_fasta ${__HERE__}/ref.fasta \ No newline at end of file diff -r 000000000000 -r 179342c7b86c test-data/annotate_vcf_test.pileup --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/annotate_vcf_test.pileup Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,3 @@ +NC_045512.2 45 G 31 CCCCACCCCCCccccccccc,ccCCC*,+3ttccCC ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +NC_045512.2 685 A 75 .-9AAGTCATTT,-9aagtcattt,-9aagtcattt*.-9AAGTCATTT*G.-9AAGTCATTT.-9AAGTCATTT,-9aagtcattt*,-9aagtcattt,-9aagtcattt,-9aagtcattt,-9aagtcattt,,-9aagtcattt,-9aagtcattt,-9aagtcatttG.-9AAGTCATTT*,-9aagtcatttG.-9AAGTCATTT.-9AAGTCATTTG.-9AAGTCATTTG.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT*.-9AAGTCATTT*.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTTG.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT.-9AAGTCATTT*,-9aagtcattt,-9aagtcattt*,-9aagtcattt,-9aagtcattt,-9aagtcattt,-9aagtcattt,-9aagtcattt,-9aagtcattt*,-4aagt,-9aagtcattt,-9aagtcattt**G,-9aagtcattt,-9aagtcattt,-9aagtcatttG,-9aagtcattt,-9aagtcattt*,-9aagtcattt* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ +NC_045512.2 1813 T 51 ..-3AAA..-2AA..-1A*.-1A.-3AAA*..-1A..-1A.-2AA.-1A.-3AAA.-2AA.-2AA.-3AAA.,-1a,-1a,-6aaaaaa,,,-1a,,-2aa,-2aa,,-1a,-1a,*,-1a,-1a,+1a,-2aa,-1a,+1a,-1a,,-2aa.-3AAA,-1a.-2AA,-1a*,-2aa,-2aa ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ diff -r 000000000000 -r 179342c7b86c test-data/annotate_vcf_test.vcf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/annotate_vcf_test.vcf Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,9 @@ +##fileformat=VCFv4.1 +##medaka_version=1.0.3 +##contig= +##FORMAT= +##FORMAT= +#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT SAMPLE +NC_045512.2 45 . G C 46.359 PASS GT:GQ 1:46 +NC_045512.2 685 . AAAGTCATTT A 260.487 PASS GT:GQ 1:260 +NC_045512.2 1813 . TA T 11.034 PASS GT:GQ 1:11 diff -r 000000000000 -r 179342c7b86c test-data/annotated.vcf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/annotated.vcf Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,16 @@ +##fileformat=VCFv4.1 +##medaka_version=1.0.3 +##contig= +##FORMAT= +##FORMAT= +##annotateVCFVersion=0.1 +##INFO= +##INFO= +##INFO= +##INFO= +##INFO= +##INFO= +#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT SAMPLE +NC_045512.2 45 . G C 46.359 PASS DP=31;AF=0.900000;FAF=0.937500;RAF=0.857143;SB=6;DP4=0,2,15,12 GT:GQ 1:46 +NC_045512.2 685 . AAAGTCATTT A 260.487 PASS DP=75;AF=0.880000;FAF=0.789474;RAF=0.972973;SB=0;DP4=0,0,30,36 GT:GQ 1:260 +NC_045512.2 1813 . TA T 11.034 PASS DP=51;AF=0.607843;FAF=0.521739;RAF=0.678571;SB=0;DP4=0,0,12,19 GT:GQ 1:11 diff -r 000000000000 -r 179342c7b86c test-data/assembly.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/assembly.fasta Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,56 @@ +>4 length=3792 depth=114.52x circular=true +TTGCGGTGTCTGCGTCAGAATCGCGTTCAGCGCGTTTCAGCGGTGCGTACAATTACAGCATTATGTTAAA +TTTTATAATTGTCTTTAGTCATTGCGCTATGATTTTGTAGGTGGAGTTGTTTCATATTTTTGATATAAAT +TCTTTTATCTCACTGAAGCAGTCATCGTCAGTATCAATGGTTTTGTTCTTCATTGATATGCCTATTCTAG +AATCTGATTCCTTATTACAACTAAGGTAAACTTGAACTTTTGCTTTCTTTTCATTATTTGGGTAAGCGTA +ATCAGGATCTAAGGATGTAATAATAGATTCTTGTTCTTTTATTTTATTGAATAGATCGTCTATATATCTA +AACACCTCTTTCTTACACGCGTGAGCAATGATTAGATCTTCTATTGCGCCATTCTTGTTTTTTCCTGGCA +TGATAAAGAAAGATATTTTTGTGCTTCCGTTAATGGCTATTTCATTATGCGAGCTTGGTGATGAAATGTT +AAGCTCATTTAATGTTGAAATTATCGATCTTTCCGTGTCAGAAAACGATTCGTCGGCATCGATGATTAAG +AATATACTTTCTTTTTCATTAAAAGACTCTATGCTTTTAAATGCTCTAAGGGTTTGTTTTAGTTTTGTCT +TTCCATTTATTTTTTCAACATAAACATCATTAATTCCTTCTATTTCAAGTAGATTGCAAAGGAAGTGAAA +ATCATCATCACCCTCAACGAAAATGACTTTTTTATAATCATTTATTTTTCTCGGTTTCATTTATCTCACC +TCCCAGCCATTTTCAACTGAAAAAGAAAAATCATCCATGTTAAATTGCATTGCTGTAGGTTTTTGAGATT +CCTTGTCTCTTCCCAGTCTTATGTAAGATATATCTTTTCTTTTTTCATCTAATTCGTTTATCGCACATAT +TACATCATGGCTGTGTGTTGTTGTAAATATTTGATTATTATTGGTTTTTGCTGCTTCTATCAAAGCGTTG +ATCATATCTTTGATTACTGAGTAATGAATTCCATTTTCTATCTCATCAATGAGAATAATTGAGTCTTTTT +GAACTAAGATTGAGCTAATGAAAGACAGCGCTCTGCTTACTCCTTCACCAAGCATTGATATTTCATTTAA +TTCACTTAGTCCTATATCTAAAAAAATCTCTTTGTTTTGATCTGTTGCTATTATTGCAATATCGTTAATT +CTATTATCTATTCTTTTTAGGTTGCCTATTATTTCATCTTTTCTTTTTTGTGTTAGTAGTTTTGATACGT +TTTTTATCGTTGCTTCTTTGTTTATGTTTCTTGATGTGGTTATTATCGCTGCGGTTTTGAATTCATATAG +CTTACCTTTTTTAGTTTGTTTTATTTCTCCGTTTATTTCTTGTGCTTTTTGTGTTATTTTTATAGTAATC +AATTCTTCTGGGGGGGTTCTTTTTCCGTTCTGTGTTTCACTAACCTTAATCATTAAAACATTCCCCTTTT +CCTGAGAGCCGAGGGTTTGTCGCAATGGAGGGGTGTTTGATAATATTGACTCAACATTGAGGGACACGCT +TGATTCACTTTGTGTGTTATCTATCGTTGAGTATTTTTGTGTTACTTCTGACCTTTCATCTCTTATTGTT +ATGGACATTTCTTTGGATGTGTCCATGTTATAAAAATAGCTATCCCAAAATGAGTTTTCTTTATTTAAAA +GAGATGCTTCATTTCTAAAGCTTTTTACTTTTAACAGAGCTGCTGGGTTTTTTACGTCATAAAATGAAAA +TATCGCGTCTAATATCGATGTTTTCCCAAAGTTGTTTTTTCCGGATATTACATTAAGTGTTTTTAGTTGT +TTGAGAGTTATGCTCTCGAAACACTTAAAATTTTTTAAGTGGATATCTTTTATCATGTTTAAACTTGCTC +TCCATTTCTGTTTACGTTTACATAGTAATAATGTGTTTATTTATGCATCACTATGCCACTGTTTCTTTTC +TAGAAGTATAATCAAAATAATATTACTTTATAGTCCTGTTTGGATTGATTTTAACCAGTTTGTCGGAGTT +TCTTCTTGTGATTATTGTGTTCTGGTCGTAATCTCCTAAACTGAAAACGAAAAAACCACCTGGGGAGGTG +GTTTGATCGAAGGTTAAGTCAGTTGGGGAACTGCTTAACCAGGTAACTGTCTTGTGCGAGACGAGTCACC +AAAACTGTCCTTTCAGTGTAGCTGTAGTCAGGCCATCACTTCAAGTACTCTCTTGAACCTCTCGCACATC +GACTTTTACCAATGGCTGCTGCCAGTGGCGCTTTGTCGTGTCTTACCGGGTTGGACTCAAGACGATAGTT +ACCGGATAAGGCGCAGCGGTCGGGCTGAACGGGGGGTTCGTGCACACAGCCCAGCTTGGAGCGAACGACC +TACACCGAACCGAGATACCTACAGCGTGAGCTATGAGAAAGCGCCACGCTTCCCGAAGGGAGAAAGGCGG +ACAGGTATCCGGTAAGCGGCAGGGTCGGAACAGGAGAGCGCACGAGGGAGCTTCCAGGGGGAAACACCTG +GTATCTTTATAGTCCTGTCGGGTTTCGCCACCTCTGGCTTGAGCGTCGATTTTTGTGATGCTCGTCAGGG +GGGCGGAGCCTATGGAAAAACGCCTGCGGCGCTGGCTTCCTCCGGTGCTTTGCTTTTTGCTCACATGTTC +TTTCCGACTTTATCCCCCGATTCTGTGGATAACCGTATTACCGCTTTTGAGTGAGCTGACACCGCTCGCC +GCAGTCGAACGACCGAGCGTAGCGAGTCAGTGAGCGAGGAAGCGGAAGAGCGCCTTATGTGACATTTTCT +CCTTACGCTCTGTTGTGCCGTTCGGCATCCTGTCCTGAGCGTTATCTCTCTGTGCTATTTTCTACTTCAA +AGCGTGTCTGGATGCTGTTCTGGAGTTCTTCTGCGAGTTCGTGCAGCTTCTCACACATGGCAGCCTGTTC +GTCAGCATCGGGTGCGTCCAGTTTTTCGAGCAGCGTCAGGCTCTGACTTTTTATGAATCCCGCCATGTTG +AGTACGGCTTGCTGCTGCTTGTTCATCTTTTCGTTTTCTCCGTTCTGTCTGTCATCTGCGTTGTGTGATT +ATATCGCGTACCACTTTTCGACTGTTTTGCTGCCGTTATTCTGCCGCTTGGCTTTTTGACGGGCATTTCT +GTCAGACAACACTGTCACTGCCAAAAAACTGCCGTGCCTTTGTCGGTAATTCGAGCTTGCTGACAGGACA +GGATGTGCAATTGTTATACCGCGCATACATGCACGCTATTACAATTGCCCTGGTCAGGGCTTTGCCCCGA +CACCCATGTCAGATACGGAGCCATGTTTTATGACAAAACGAAGTGGAAGTAATACGCGCAGGCGGGCTAT +CAGTCGCCCTGTTCGTCTGACGGCAGAAGAAGACCAGGAAATCAGAAAAAGGGCTGCTGAATGCGGCAAG +ACCGTTTCCGGTTTTTTACGGGCGGCAGCTCTCGGTAAGAAAGTTAACTCACTGACTGATGATCGGGTAC +TGAAAGAAGTTATGAGACTGGGGGCGTTACAGAAAAAACTCTTTATCGACGGCAAGCGTGTCGGGGACAG +GGAGTATGCGGAGGTGCTGATCGCTATTACGGAGTATCACCGTGCCCTGTTATCCAGACTTATGGCAGAT +TAGCTTCCCGGAGAGAAAACTGTCGAAAACAGACGGTATGAACACCGTAAGCTCCCAAAGTGATCACCAT +TCGCTTTCATGCATAGCTATGCAGCGAGCTGAAAACGATCCTGACGCATCCTTCCTGTTTTCCCGGGGTA +AAACATCTCTTT \ No newline at end of file diff -r 000000000000 -r 179342c7b86c test-data/basecalls.fastq.gz Binary file test-data/basecalls.fastq.gz has changed diff -r 000000000000 -r 179342c7b86c test-data/consensus.hdf Binary file test-data/consensus.hdf has changed diff -r 000000000000 -r 179342c7b86c test-data/medaka_test.bam Binary file test-data/medaka_test.bam has changed diff -r 000000000000 -r 179342c7b86c test-data/medaka_test.bam.bai Binary file test-data/medaka_test.bam.bai has changed diff -r 000000000000 -r 179342c7b86c test-data/medaka_test.hdf Binary file test-data/medaka_test.hdf has changed diff -r 000000000000 -r 179342c7b86c test-data/ref.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/ref.fasta Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,2 @@ +>NC_045512.2 +attaaaggtttataccttcccaggtaacaaaccaaccaactttcgatctcttgtagatctgttctctaaacgaactttaaaatctgtgtggctGTCACTCGGCTGCATGCTTAGTGCACTCACGCAGTATAATTAATAACTAATTACTGTCGTTGACAGGACACGAGTAACTCGTCTATCTTCTGCAGGCTGCTTACGGTTTCGTCCGTGTTGCAGCCGATCATCAGCACATCTAGGTTTCGTCCGGGTGTGACCGAAAGGTAAGATGGAGAGCCTTGTCCCTGGTTTCAACGAGAAAACACACGTCCAACTCAGTTTGCCTGTTTTACAGGTTCGCGACGTGCTCGTACGTGGCTTTGGAGACTCCGTGGAGGAGGTCTTATCAGAGGCACGTCAACATCTTAAAGATGGCACTTGTGGCTTAGTAGAAGTTGAAAAAGGCGTTTTGCCTCAACTTGAACAGCCCTATGTGTTCATCAAACGTTCGGATGCTCGAACTGCACCTCATGGTCATGTTATGGTTGAGCTGGTAGCAGAACTCGAAGGCATTCAGTACGGTCGTAGTGGTGAGACACTTGGTGTCCTTGTCCCTCATGTGGGCGAAATACCAGTGGCTTACCGCAAGGTTCTTCTTCGTAAGAACGGTAATAAAGGAGCTGGTGGCCATAGTTACGGCGCCGATCTAAAGTCATTTGACTTAGGCGACGAGCTTGGCACTGATCCTTATGAAGATTTTCAAGAAAACTGGAACACTAAACATAGCAGTGGTGTTACCCGTGAACTCATGCGTGAGCTTAACGGAGGGGCATACACTCGCTATGTCGATAACAACTTCTGTGGCCCTGATGGCTACCCTCTTGAGTGCATTAAAGACCTTCTAGCACGTGCTGGTAAAGCTTCATGCACTTTGTCCGAACAACTGGACTTTATTGACACTAAGAGGGGTGTATACTGCTGCCGTGAACATGAGCATGAAATTGCTTGGTACACGGAACGTTCTGAAAAGAGCTATGAATTGCAGACACCTTTTGAAATTAAATTGGCAAAGAAATTTGACACCTTCAATGGGGAATGTCCAAATTTTGTATTTCCCTTAAATTCCATAATCAAGACTATTCAACCAAGGGTTGAAAAGAAAAAGCTTGATGGCTTTATGGGTAGAATTCGATCTGTCTATCCAGTTGCGTCACCAAATGAATGCAACCAAATGTGCCTTTCAACTCTCATGAAGTGTGATCATTGTGGTGAAACTTCATGGCAGACGGGCGATTTTGTTAAAGCCACTTGCGAATTTTGTGGCACTGAGAATTTGACTAAAGAAGGTGCCACTACTTGTGGTTACTTACCCCAAAATGCTGTTGTTAAAATTTATTGTCCAGCATGTCACAATTCAGAAGTAGGACCTGAGCATAGTCTTGCCGAATACCATAATGAATCTGGCTTGAAAACCATTCTTCGTAAGGGTGGTCGCACTATTGCCTTTGGAGGCTGTGTGTTCTCTTATGTTGGTTGCCATAACAAGTGTGCCTATTGGGTTCCACGTGCTAGCGCTAACATAGGTTGTAACCATACAGGTGTTGTTGGAGAAGGTTCCGAAGGTCTTAATGACAACCTTCTTGAAATACTCCAAAAAGAGAAAGTCAACATCAATATTGTTGGTGACTTTAAACTTAATGAAGAGATCGCCATTATTTTGGCATCTTTTTCTGCTTCCACAAGTGCTTTTGTGGAAACTGTGAAAGGTTTGGATTATAAAGCATTCAAACAAATTGTTGAATCCTGTGGTAATTTTAAAGTTACAAAAGGAAAAGCTAAAAAAGGTGCCTGGAATATTGGTGAACAGAAATCAATACTGAGTCCTCTTTATGCATTTGCATCAGAGGCTGCTCGTGTTGTACGATCAATTTTCTCCCGCACTCTTGAAACTGCTCAAAATTCTGTGCGTGTTTTACAGAAGGCCGCTATAACAATACTAGATGGAATTTCACAGTATTCACTGAGACTCATTGATGCTATGATGTTCACATCTGATTTGGCTACTAACAATCTAGTTGTAATGGCCTACATTACAGGTGGTGTTGTTCAGTTGACTTCGCAGTGGCTAACTAACATCTTTGGCACTGTTTATGAAAAACTCAAACCCGTCCTTGATTGGCTTGAAGAGAAGTTTAAGGAAGGTGTAGAGTTTCTTAGAGACGGTTGGGAAATTGTTAAATTTATCTCAACCTGTGCTTGTGAAATTGTCGGTGGACAAATTGTCACCTGTGCAAAGGAAATTAAGGAGAGTGTTCAGACATTCTTTAAGCTTGTAAATAAATTTTTGGCTTTGTGTGCTGACTCTATCATTATTGGTGGAGCTAAACTTAAAGCCTTGAATTTAGGTGAAACATTTGTCACGCACTCAAAGGGATTGTACAGAAAGTGTGTTAAATCCAGAGAAGAAACTGGCCTACTCATGCCTCTAAAAGCCCCAAAAGAAATTATCTTCTTAGAGGGAGAAACACTTCCCACAGAAGTGTTAACAGAGGAAGTTGTCTTGAAAACTGGTGATTTACAACCATTAGAACAACCTACTAGTGAAGCTGTTGAAGCTCCATTGGTTGGTACACCAGTTTGTATTAACGGGCTTATGTTGCTCGAAATCAAAGACACAGAAAAGTACTGTGCCCTTGCACCTAATATGATGGTAACAAACAATACCTTCACACTCAAAGGCGGTGCACCAACAAAGGTTACTTTTGGTGATGACACTGTGATAGAAGTGCAAGGTTACAAGAGTGTGAATATCACTTTTGAACTTGATGAAAGGATTGATAAAGTACTTAATGAGAAGTGCTCTGCCTATACAGTTGAACTCGGTACAGAAGTAAATGAGTTCGCCTGTGTTGTGGCAGATGCTGTCATAAAAACTTTGCAACCAGTATCTGAATTACTTACACC diff -r 000000000000 -r 179342c7b86c test-data/ref.fasta.fai --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/ref.fasta.fai Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,1 @@ +NC_045512.2 2940 13 2940 2941 diff -r 000000000000 -r 179342c7b86c test-data/ref.fasta.gz Binary file test-data/ref.fasta.gz has changed diff -r 000000000000 -r 179342c7b86c test-data/variants.vcf.gz Binary file test-data/variants.vcf.gz has changed diff -r 000000000000 -r 179342c7b86c tool_data_table_conf.xml.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.sample Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,7 @@ + + + + value, dbkey, name, path + +
+
diff -r 000000000000 -r 179342c7b86c tool_data_table_conf.xml.test --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.test Wed Oct 12 07:43:59 2022 +0000 @@ -0,0 +1,7 @@ + + + + value, dbkey, name, path + +
+
\ No newline at end of file