# HG changeset patch
# User iuc
# Date 1652274218 0
# Node ID 7303183cdb87e0798a0d26c8f6e0a07c3b83dd89
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/ensembl_vep commit 2db33cd5bcf5e2d7e3a43f11855c4cfc3b1b9f56
diff -r 000000000000 -r 7303183cdb87 ensembl_vep.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/ensembl_vep.xml Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,370 @@
+
+ with VEP
+
+ 106.1
+ 106
+
+
+
+
+
+
+
+
+
+
+
+ ensembl-vep
+ perl-math-cdf
+ grep
+
+ 'custom_annotation.${custom_ext}.gz' &&
+ tabix -p gff 'custom_annotation.${custom_ext}.gz' &&
+ #end if
+ vep -i '${annotation_cache.input1}' -o MainOutput.vcf --vcf
+ #if $annotation_cache.source == "custom":
+ --$custom_ext 'custom_annotation.${custom_ext}.gz'
+ #else:
+ --cache
+ --species '${annotation_cache.cache_file.fields.species}'
+ --dir_cache '${annotation_cache.cache_file.fields.path}'
+ #if $annotation_cache.cache_file.fields.cachetype == "refseq": --refseq
+ #if $annotation_cache.cache_file.fields.cachetype == "merged": --merged
+ #if $annotation_cache.cache_file.fields.version != "@DB_VERSION@": --cache_version $annotation_cache.cache_file.fields.version
+ ## --offline is passed only in cache mode: the flag implicitly enables --cache, which is unwanted for custom GFF/GTF annotation, and it is unnecessary there anyway because annotating from these custom sources requires no internet connection.
+ --offline
+ #end if
+ #if $ref_seq.ref_source == "cached":
+ --fasta '${ref_seq.ref.fields.path}'
+ #elif $ref_seq.ref_source == "history":
+ --fasta '${ref_seq.ref}'
+ #end if
+ --stats_text
+
+ #if $out_opt.sift != "None": --sift $out_opt.sift
+ #if $out_opt.polyphen != "None": --polyphen $out_opt.polyphen
+ #if $out_opt.nearest != "None": --nearest $out_opt.nearest
+ #if int($out_opt.distance_custom.distance_1) > -1:
+ --distance $out_opt.distance_custom.distance_1#if int($out_opt.distance_custom.distance_2) > -1: ,$out_opt.distance_custom.distance_2
+ #end if
+ #if $out_opt.cell_type != "": --cell_type '$out_opt.cell_type'
+ #if $out_opt.individual != "": --individual $out_opt.individual
+ --vcf_info_field $out_opt.vcf_info_type.vcf_info_field
+ --terms $out_opt.terms
+ #if $out_opt.out_opt_checkboxes != "None": ${' '.join(str($out_opt.out_opt_checkboxes).split(","))}
+ #if $out_opt.shift_var.shift_selector != "None":
+ $out_opt.shift_var.shift_selector
+ #if $out_opt.shift_var.shift_selector == "--shift_hgvs 0 --shift_3prime 1"
+ #if $out_opt.shift_var.shift_length != "None": $out_opt.shift_var.shift_length
+ #end if
+ #end if
+ #if $ident.input_synonyms: --synonyms '${ident.input_synonyms}'
+ #if $ident.ident_checkboxes != "None": ${' '.join(str($ident.ident_checkboxes).split(","))}
+ #if $colo_var.colo_var_checkboxes != "None": ${' '.join(str($colo_var.colo_var_checkboxes).split(","))}
+ #if $fil_qc.fil_qc_checkboxes != "None": ${' '.join(str($fil_qc.fil_qc_checkboxes).split(","))}
+ $plugins.carol
+ $plugins.condel
+ #if $plugins.exacpli_file: --plugin ExACpLI,'${plugins.exacpli_file}'
+ #if $plugins.loftool_file: --plugin LoFtool,'${plugins.loftool_file}'
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ 10.1186/s13059-016-0974-4
+
+
diff -r 000000000000 -r 7303183cdb87 test-data/input_test1.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_test1.vcf Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,3 @@
+##fileformat=VCFv4.0
+#CHROM POS ID REF ALT QUAL FILTER INFO
+chrM 5701 . GA G . . .
diff -r 000000000000 -r 7303183cdb87 test-data/input_test2.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_test2.vcf Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,8 @@
+##fileformat=VCFv4.1
+##contig=
+##contig=
+##ALT=
+##INFO=
+##INFO=
+#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT HG00096
+21 5733 rs142513484 C T . . . GT 0|0
diff -r 000000000000 -r 7303183cdb87 test-data/output_test1.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_test1.vcf Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,5 @@
+##fileformat=VCFv4.0
+##VEP="v105" time="2022-03-07 13:29:51" cache="/home/sebastian/.planemo/planemo_tmp_fhheutk7/test-data/test-cache/drosophila_melanogaster/105_BDGP6.32" db="drosophila_melanogaster_core_105_9@ensembldb.ensembl.org" ensembl-io=105.2a0a40c ensembl-variation=105.ac8178e ensembl=105.525fbcb ensembl-funcgen=105.660df8f assembly="BDGP6.32" genebuild="dmel_r6.32_FB2020_01"
+##INFO=
+#CHROM POS ID REF ALT QUAL FILTER INFO
+chrM 5701 . GA G . . CSQ=-|downstream_gene_variant|MODIFIER|mt:ND2|FBgn0013680|Transcript|FBtr0100857|protein_coding|||||||||||4439|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Trp-TCA|FBgn0013709|Transcript|FBtr0100858|tRNA|||||||||||4373|1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Cys-GCA|FBgn0013690|Transcript|FBtr0100859|tRNA|||||||||||4319|-1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Tyr-GTA|FBgn0013710|Transcript|FBtr0100860|tRNA|||||||||||4234|-1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:CoI|FBgn0013674|Transcript|FBtr0100861|protein_coding|||||||||||2693|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Leu-TAA|FBgn0013699|Transcript|FBtr0100862|tRNA|||||||||||2625|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:CoII|FBgn0013675|Transcript|FBtr0100863|protein_coding|||||||||||1935|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Lys-CTT|FBgn0013697|Transcript|FBtr0100864|tRNA|||||||||||1864|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Asp-GTC|FBgn0013691|Transcript|FBtr0100865|tRNA|||||||||||1796|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:ATPase8|FBgn0013673|Transcript|FBtr0100866|protein_coding|||||||||||1634|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:CoIII|FBgn0013676|Transcript|FBtr0100868|protein_coding|||||||||||178|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Gly-TCC|FBgn0013694|Transcript|FBtr0100869|tRNA|||||||||||95|1||FlyBaseName_gene|,-|frameshift_variant|HIGH|mt:ND3|FBgn0013681|Transcript|FBtr0100870|protein_coding|1/1||||95|95|32|D/X|gAc/gc|||1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Ala-TGC|FBgn0013689|Transcript|FBtr0100871|tRNA|||||||||||281|1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Arg-TCG|FBgn0013704|Transcript|FBtr0100872|tRNA|||||||||||360|1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Asn-GTT|FBgn0013701|T
ranscript|FBtr0100873|tRNA|||||||||||424|1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Ser-GCT|FBgn0013705|Transcript|FBtr0100874|tRNA|||||||||||489|1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Glu-TTC|FBgn0013692|Transcript|FBtr0100875|tRNA|||||||||||557|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Phe-GAA|FBgn0013693|Transcript|FBtr0100876|tRNA|||||||||||642|-1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:His-GTG|FBgn0013695|Transcript|FBtr0100878|tRNA|||||||||||2439|-1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:ND4L|FBgn0013683|Transcript|FBtr0100880|protein_coding|||||||||||3843|-1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:tRNA:Thr-TGT|FBgn0013707|Transcript|FBtr0100881|tRNA|||||||||||4136|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:tRNA:Pro-TGG|FBgn0013702|Transcript|FBtr0100882|tRNA|||||||||||4202|-1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:ND6|FBgn0013685|Transcript|FBtr0100883|protein_coding|||||||||||4269|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:ATPase6|FBgn0013672|Transcript|FBtr0433498|protein_coding|||||||||||966|1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:ND4|FBgn0262952|Transcript|FBtr0433500|protein_coding|||||||||||2505|-1||FlyBaseName_gene|,-|downstream_gene_variant|MODIFIER|mt:ND5|FBgn0013684|Transcript|FBtr0433501|protein_coding|||||||||||707|-1||FlyBaseName_gene|,-|upstream_gene_variant|MODIFIER|mt:Cyt-b|FBgn0013678|Transcript|FBtr0433502|protein_coding|||||||||||4797|1||FlyBaseName_gene|
diff -r 000000000000 -r 7303183cdb87 test-data/output_test2.vcf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/output_test2.vcf Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,11 @@
+##fileformat=VCFv4.1
+##contig=
+##contig=
+##ALT=
+##INFO=
+##INFO=
+##VEP="v105" time="2022-03-30 19:24:59" ensembl=105.525fbcb ensembl-io=105.2a0a40c ensembl-funcgen=105.660df8f ensembl-variation=105.ac8178e
+##INFO=
+##INFO=
+#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT HG00096
+21 5733 rs142513484 C T . . CSQ=T|3_prime_UTR_variant|MODIFIER|MRPL39|ENSG00000154719|Transcript|ENST00000307301|protein_coding|3/3||||159|||||||-1||||custom_annotation.gtf.gz|,T|missense_variant|MODERATE|MRPL39|ENSG00000154719|Transcript|ENST00000352957|protein_coding|2/2||||70|70|24|A/T|Gca/Aca|||-1||||custom_annotation.gtf.gz|,T|upstream_gene_variant|MODIFIER|AP000223.42|ENSG00000260583|Transcript|ENST00000567517|antisense|||||||||||2407|-1||||custom_annotation.gtf.gz| GT 0|0
diff -r 000000000000 -r 7303183cdb87 test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/chr_synonyms.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/chr_synonyms.txt Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,7 @@
+KJ947872 chrM
+NC_024511.2 chrM
+KJ947872 mitochondrion_genome
+KJ947872.2 chrM
+KJ947872.2 mitochondrion_genome
+NC_024511.2 mitochondrion_genome
+chrM mitochondrion_genome
diff -r 000000000000 -r 7303183cdb87 test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/info.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/info.txt Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,6 @@
+species drosophila_melanogaster
+assembly BDGP6.32
+sift
+polyphen
+source_genebuild dmel_r6.32_FB2020_01
+source_assembly BDGP6.32
diff -r 000000000000 -r 7303183cdb87 test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/mitochondrion_genome/1-1000000.gz
Binary file test-data/test-cache/drosophila_melanogaster/106_BDGP6.32/mitochondrion_genome/1-1000000.gz has changed
diff -r 000000000000 -r 7303183cdb87 test-data/test.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test.fa Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,168 @@
+>21 dna:chromosome chromosome:GRCh38:21:1:10000:1 REF
+CCACAATCATTTTAGGAGAATGGGTTTAAGAAAGGAAAAAAAAAAAAAAGATTTCTGTAT
+GCTCTTAAGAGAAAATCTAAAAAATAATGACATGAAAAAGTTGAAAGGAATGGAAAAATA
+TGTACCATTAAAAGGAAACCCGACGTATGAATGCCATTATCAGACAAAACAGATTTTTTT
+CTTTTTGAGATGGAGTCTCACTCTGTGGCCCAGGCTGGAGTGCAGTGGCACAATCTCTGC
+TCACAGCAAGCTCCGCCTCCCAGGTTCATGCCATTCTCCTGCCTCAGCCTCCCAAGTAGC
+TGGGACTACAGGCACCCACCACCACACCAGGCTAGTATTTGTATTTTTAGTAGAGACGGG
+GTTTCATCGTGTTAGCCAGGATGGTCTCAATCTTCTGACCTCGTGATCTGCCCACCTCAG
+CCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACCGCGCCCAGCCAGACAAAACAGATT
+TTAAGACAACTAAGAAGTTAACAAGCTGACCCTACAATAAGCATGAAAATTTTGAAAAAG
+AATAGGAAAGGAGAACTCACCATAAGAGAAATTGAAACTTGTTATAAAGCTATAGTTGTT
+AAAACGGTGTTACTACAGTGGTACATGGACAGATAAATGGACCAATGAAGCAGACCCAGG
+CACTGAAAGGAACCTTTTATATGACAGCATGGCACAATCAGTAAGAATAGAGAGGAAATA
+GGCCAGGCACGGTGGCTCACGCCTGTAATCCCAGTACTTTGGGAGGCCAAGGCAGGCAGA
+TCACCTGAGGTCAGGAGTTCGAGACCAGCCTGGTCAACATGGTGAAACCGCGTCTCTACT
+AAAAATACAAAAATTAGCTGGTCGTGGTGGCAGGCACCTGTAATCCCAGCTACTCGGGAG
+GCTGAGGCAGGAGAATCACTTGAACCCGGCTAGCGGAGGCTGCAGTGAGCCGAGATCACG
+CCATTGCACTCCAGCCTAGGCAACAAGAGTGAAACTCCATCACAAAAAAAAAAGAAAAAG
+AGTAGACAGGAAATAAATGGTCCAGAATAACTGCCTATCCTTGTGGAGGAGAGGGTGATT
+CAAAATTAGGTCCCTTTCCTCACTCTATATGCAAAAAACAAACTTCAAATAAATTATACA
+ATTAAATGTGAAAATCAAGACTTTAAAATAAACAATGCAGTAGGCTGCTTTATAATATCA
+AGTTAGGGAAGGCTTTCTTAAATTTCATAAACATAAATCATAGAGGAAAAGATGAACTGT
+CTACCTTAAAATTAAAGACGATATAAACAAAATTAAAAGGTAAGCCAGACAAAAGAAATA
+TTTGTAGTGACAACGGTTTAACTTTCTTTCTTTCTTTTTTTTTTTTTGAGACGGAATCTC
+ACTCTGTCACCCAGGCTGGAGTACACTGGTGCAATCTCAGCTCACTGCAACCTCCACCTC
+CCAGGTTCAAGCGATTCTTGTGCCTCAGCCTCCCAAGTAGCTGGGATGACAGGTACGCAC
+CACCACACCCAGCTAATTTTTTGTATTTTTAGCAGAGACGGGGTTTCACCATGTTGGCCA
+GGCTGGTCTCGAATTCCTGACCTCAGGTGATCCATCTGCCTCAGCCTCCCAAAGTGCTGG
+GATTACAGGAGTGAGCCACTGCACCTGGCCCACAAGGGTTTCACTTTCTAAAAATATAAA
+GAACTGGCCAGGTGCAATGGCTCACACTTGTAATCCTAGCACTTTGGGAGGGCAAGGAGA
+GCAGATCGCTAGAGGCCAGAAGCTGGAGAACAGCCTGGCCAACATGGTGAAACCCCATCT
+CTACTTTAAAAATATAAAAATTAGTTGGGTGTGGTGGCACTTGCCTATAATCCCAGCTAC
+TTGGCTACTCAGGAGGCCGAGGCAGGGGAATCGCTTGAATCCAGTAGGCAGAGGCTACAG
+TGAGCCAAGATCATGCCACTGCACTACAGCTTGGGCAACAGAGTGAGACTTGGTCTCAAA
+AAAAAAAAAAATTATATATATATATCTTATATATATACACTATTATATATATACACACAC
+ACACACACACACACACACACACACACACACACAATTAATATGAGATGCCCAAAAATCCAA
+TTGTAAAAAGGGGCAAAGGTTGTAAACTGGTAATTCATAAAAACAAATGAAGAGATGCTT
+ATTGGTACTATATGCTCAGTATTAAGCAAATTAAATGAGATAGGATCGTGCATATTCAAC
+CAACAAAATATCTGAATGTCTGAAAATAATAAATGTTAATGAGGGAGTGGAGAAAATGGG
+AATGCTCATACTGCTGATAGAGAGTAAACTGGTACAACTATTGTGGCAGCCAATTAATAT
+TTAGTAAAGCTGAAGATGCATGGTCCACTGTGGTACAGGCCCTGGAGATATTATCAAATG
+TGTACACAAAGAAACACGCACAAGGATATTTTCTGCGATACTGTAATACTCAAAAGCCAA
+TGACATCCTCAGTGGTCATCAATAAGAAAATGAATTAATGATGGGATTAATCATATAATG
+AAATACTATATAGCAGTTGAAATGAATGTACTCTTTACATGTATCAACATGCTATACATA
+AAAAACAATGATGAGCAATAAAAGCAAATTGCAAAAGGATATATATTATGAAACCAATTA
+TGTTTAGTTTTAAAACACAGAGAATACTATGGATTGTAGTAAAAAAAAATATAAAATCAT
+GAAGAGTAAGGACAGGTACAAACAGGATAGTGGTTCTTCTTGAGAGGAAGGAAATGACAT
+AACAAGACCTTCAATGGATGTGCAGCTTTTCCTTTATTTAAACACAAAAGGATCTGAAGG
+AAATAAGGAAAAAGGTTGACAGTGGTTACAATTAAATAGTGGCTGTATGTCAACACTCTT
+GGTTACAAACAACAGGATCTACACTAGCTAGTTTAAACAAACAGAATAAAATGGCTCACA
+AGTCACAGGCGTGGAGGTCAGGACTACGGAGCCCCCAAAAATGCCCATTTTTATACCTTG
+GAGCAGCTGCGGGGGAAAAACTGCTAAGCAAAGCCTCCACACCTTGCACCATTACATGGG
+ACCTCTGCCACTGCTGCCTTGAAAACCACATCACTGCTCCGTTCAACAAAATGTATCTCA
+TACTACTCTTGTCTGCAAAGTACTTGCTTCCAGATTTCACACAGTTATGTCTAATTGGTG
+AGCCCATGCTACCTGTCTGAGCCACAGCTGCAAGGAAGGGCAGGAGATTAAATTTCATTC
+TTCTACTGGGTAAGGCGAGATCCACAGAGTGGGAAGTTGCCAAAAAGCAGGTGTTCAAAC
+AGTGCTAGCTGCCCAAAAAGCACGAAAAGTGCCCACTCAAACAAGAGTTGGTGAAAATAT
+TCTCTCTACTTTTCTGTATGCTCAAATATTTCACAATTTTTTTAAAGAAAAAATGTCGAA
+GTATGTAAATTCACAAACAACAAAGGGAATGGAAAAAAAATCAATAAACAAGAGACGTCA
+ACCAAATTCTAAAAGACAAAAAGCTAAGTGACTAATAAAACACTAGAGAATGTCACCACC
+TAGAAAACATGTGGAGGAAGTTCCATCAGAGGCAGCCAACCGGCCCAGCTGGGCCTTAGC
+TCAGAGGCAGCAAAAGTTCATAGATGATAGAAGACAGTAGAGGGATTAGTTAAATCTAAA
+CTAATTAAAAAGAAAGGAATTAATTAAAGGTCTGTATACAAACTGGTTGAACACTACCCC
+ATCTTCAAATATAGAAGGGCCTAAATCCAGGAAGTGCCCCATGCAAAATATTGAAGGGAT
+CTTTATTATAAAGTAAGTGAAAGAACAGTCTGGGTAAAACTAGGATAGTCAATTTAGAAA
+TCGGTAGCCAAGACAAGACCTCTTCATTCTAGCATTTTAAAAACCCTCATCCTACCAGCC
+AGATTTACCTACTTATCCTTAGTGATGCTTATGAGAAGCCAAACCTTCCTCAAACCACAG
+AGCTGCCACTCAACCTCCCTACATCCACATCTTCAACTACAAACTGACAGCCAACAAACG
+TAAGACATTTGAAAAAAGCCTGAAACATGTAGATGAAAGACTAAGAAAAAAATCTGTCAC
+TGGAGAAAAGAGATGATTCAGGGACTAGAAAGTGAATGAAGAAATGAATAAAAATTATAT
+TGATATCTTCAGAGAGCTTCATGAAAATACTTCACATCCAGAAAACATGAAAAGGATTCT
+ATGAAACAGAAGCAAAAGAGAGCTTTCAGAAATTAAAATATGCTTGACATAATGTGAGTA
+AAATATAAATGCAGGAAAAATAATAGAGAAAGGGAAAAAAATACAGAGGACCAATACAGA
+CGATGCAAATACAGCTGAAAGGTATTAGAGAAACAAAGAACCTCCAGAGAAAAGAAAGAA
+CAAATAAAGTAAAAAAACATAAAAGAGAGATGTCAAAAATTGAAAGGATCGCCTACGTAC
+CAAGCAGAATAACTGACTGAAGACCTAGATACAGGTACAGGATTGTCGAATTTTACAACA
+CCAAGAATAATAAGATCCTAAGTGTCCAGAGTGTGTTGAGAGAAGGGGATGCAGAGAACA
+GGTTATATAAAAAAGGAACAAGAATCAGACTGGCATCAGACCTTTCATTAGCAAAATCAG
+ATGCCAGAAAATAACTGAGCTGCTTTCAAAGTTCTAAGAGAAAACTACTTTTCAATCTAG
+AATTCTGTATCTAGCTGAATAGTTCATCAAATGTAAGCGCATAACCCACTTTAGACATGC
+AATGGCTCACCTCTTAGACATTTTTTCCTAGAAAGGAGCTTAGAGACAAATGCTAGCAAA
+ATGAGAAAGTTAATCAAGAAACAGGAAGATATGGACTCTAAGAAAAAGTTGACCTCACCC
+AGAAAAAAAAAAAAAAAAATACGGCCTTCAGAGGAAGCCTGTGCACAAGATGCAGAAAAC
+TTGCTGACAAAGAAGCAGAAACTTTTTGGCAAAATATTTTTGTAAGACTGATAACCAAGG
+CTTACTCAAGGTGTGGGGAAACAGGCACTCTTAGACAGTTATTGGGAGTAACACTTGGCA
+AAACCTTTGGGAAGCCAGCATCTGGTAGCACCTGACAGTAATTCCACTGCCAGAAATCTA
+TTTCTACAGAATTATTTATACGTGAGGCAACATAGAGTAGAACATAAGAGCATGTGAGTG
+AAACTACCTCCGTTCAAATTCCCACTTTACCACTTTCAAGCTCTATGCTGTTTCCTCATT
+TAAAAAATAGAAACATCTTCTCAACAGGTCACTATGAGGATTATAGAAAAGGTTCCACAC
+GTGATGGGCTTCGCACAAGACCCAGCACATGATAAATACTCAGTTAATATTACTTATCTA
+CAAACATTTGCCATTTTTGCACAAGGATGTTTACTGTGCCACTGTTCGGCAAAAAACGCA
+AGCAAGTATAGTATGGTCCTATTTATGTTTTTTAGAAATTACATTTATATTTGTATGTAT
+CTGCCTAGATCTGTAGGAAAAAATAGAGAAAACATGCTAAAGTGTTGCATCCATGGAGCA
+GGAAGGGAGTGACCTGTTTTTGTACAGTTTTTACTTAAGCAACATGAAGTGTTTCATACT
+TTAGAGAAAAGAAAAAGTAAAGATCACTATCAATCTTGGGGAGAAAGGGTTAATCTGTAT
+AAGCACACACAAACATTATATTTAAAACATTTATTTTATTATACATATTTAAATTTTAGA
+AAGTTATTAGGTAGATGTACATTCCTCTGTTGCTTTACTTTGATCTTCAGTTACCTGTAA
+AAACATGAATAGCTTTACTTTCCTAATAAACACTTTCAGTTTTACCCTTCACCCACCATT
+TTAAATCATTCCACAGCCCTCTTATAATGACCCTTTATCTTTCCCCTTAAATAGTAGAAT
+AGAAAGTTAGGTAAGAAGAAAGATTTAAAGGCCAAGTAACCAATATAAATTATCAGGTAA
+AGAACAATAATTCCATTCAAAAATATAATCTAAGGCATATTATACCTAGGCTTCTCAAGT
+TGGCCATTTTACTTTTCAGCCGTAAAACAAAATCATTAGTGTAAGAAAAAACACCTGAAG
+TGCTGTAACAAGCTATTTTAAATCAGTTTATTTTCTTTTGGAGTATAATTCCATTTAGAA
+TAGAACATATTACAGATTTAGTCTAAATAGATATCTCTATGTCCCTATTTCTATTCTGTG
+TCACTCAGACTCATCAAACAGACATGGCTAAATCTGAATTCAACACCCCAAAACCTGTCC
+TACCTGCATCATCTATCTTGGTAAAGGGCTCCACCCAGATACCTAAGGACAGCATTCAAG
+AATTCACTCTCTTCTTCCTACCTGCATATTCCATCAACAGTCCTACTAATTCAGCCTAAG
+TTAACTCTCACAGTCATTCTCCCTATCGCGGCTGAACTTTAGGACCTCATTCTCTTCTAT
+CCCCCTAACAGAACTCTTGGCTTAAGTCACAGCTATATCCCATGCTACCCCTAGAATGAG
+CTTTTAAACAAGAATAGCTGATCAACAGGTCACTTCCCTACTCAAAATTCTCCAGTTACT
+CTCTAGCATCTCAGTGGGGTGGAGGAGGAAAGTCAGGAATGCAAGTTCCACAACACGGGA
+CACAAGCCCCTCATATTCTGTTTTTGGACTGACTCTTTACCTATCCTACATGTGACCTGT
+ACATTCAAATTCATCTTACATTCATCATGTTCTCTATGTAGGCAAGTGACTTCCTCTGAG
+ATAACCTCCAACCCATTTTCCAACAGATTATCTGCATGGTCCACTTTTATTCACCCTTTA
+AAATCAGCTTAAGAGACTCCAATTCCTGGAAGCCTTCCTTAAGCAACTCCCCAGCTTGGT
+CTGAGTCCTCTTCTTTATGCCAGAGCCCCACATGTACACCTGAACTGTCTGCTTATAAGT
+CTAATTATCCAATCAACATTACTTCCCTGAGGCAGCAAGTAAATTTTGTGCATTTTTTTG
+TACCTCCAGACCATAACAGTACCTGGCACACAATAAACAATCAGTAAGTCTGTGTTGCAT
+CAATGAACCACGTTTAATCTAATCCCTTCAGAAAAGCAAAATGGACAGTAGAAAAAAGCA
+ACTAAACCAGAATAAATGTTTGAAAAAATATGTATTGACTAACATCACTAGATATTCTAG
+GTAAGACACTGTCTCTGCCGTTTTTCTACATTTTTCATTCCTTTAAAGTGTTCAGTTACT
+ACTGCTTCTTTAATTTTCCAAACTATTTCTTTAATATTCTTTAGCTTTTTAAATTTTTTT
+TAATTTTACTTAACTCCAAGTAAACATGCTGAACATTTTTTCTTTAGTTTCTTCATCTAA
+AATGATCACTGTGACCAACTAAAAAGAGAAAATTACTCCATCCATTCAAAGGTAATTTCT
+TCTCATGAGAAAAAAAATTATATAACCCTTACTCAAGAACATTATGGTGAAGTCCCTAAA
+CAATAATTCCTATCTACATAGTCATTAATAAAGACTAGGTTTATATATCATTATGAAAAA
+TTGTCAATAAATATTTCTTGGGTAACCCCTTCATGTGCTAATGTTGTGTTCAAAATTTGG
+GCTTACACAAATATAACAAATCCTGAAAGGCTTAACAGACAGAAAATAAATGTACTGGCA
+AAGAAAACAATCAAAAAATAGTATGTGGACATATACAATCAAGCACAAACTTATATGAAT
+AATTATTTGTTAGAGATTACTCTGAGACTGTTCCATGGAGGAGGTACGACTCAGGCGAGG
+TAGTGAAGAATGACTGCGTAGTAAATAGAAGGAGAATGGGAAATGGAGTCTAGAAAGAAA
+AACTATCATGAAGAAATAAGCAAACTTGAAAATAAGTTTAATGTGTGATGCTTAATGTGC
+CTGCAAGCTTAACCAGTGTTTGTGGCATTGTGGGAAATTAGGATAAGGAGGAAGTCCTAA
+TGAGGACAGATTACACAGGACAGCTATCAGATAACCTAAGTAAAAGAGGCACACTTAGCC
+TATGAAATAGGAAACAGGAATAGTTGTGGTCAAGAAATACAATCACCCGGGCCGGGCGCG
+GTGGCTCACGCCTGTAATCCCAGCACCTTGGGAGGCTGAGGGGGGTGGATCACGAGGTCA
+GGAGATCGAGACCATCCTGGCTAACACGGTAAAACCCTGTCTCTACTAAAAATACAAAAA
+AATTAGTTGGACGTAGTGGTGGGCACCCATAGTCCCAGCTACTTGGGAGGCTGAGGCACG
+AGAATCGCTTGAGCCCGGGAGGTGGAGGTTGCAGTGAGCTGAGATCGCGCCACTGCACTC
+CAGCCTGGGAGACAGAACAAGACTCTGTCTCAAAAAAAAAAAGAAAAGAAATACTATCAT
+TCCTACTCATTAAGTCTAAATGCTAATGACAAAGAATAAACTACAAAAACACAAACATTC
+AAATCTGGTTTTTCAGGACATTAGGATATTTGCACATTTACTGTTAATGGCTAAAGGCGG
+CTTTAAAATACACCTGACAAATCTTAATCCTCTAAATATTCATTAAGTTTACAAAATAAA
+TCCTAAGACCTAACTGATACCATTACAACTATTAAGAACTATTACTATTACATAGTAATA
+TTCTTATTTCTCTTCAAGTTCTACAATATCATTTTCACGATATTAACAAATAAAATCAAA
+AGAGAACTGCCAAGTTACAACTTTACCCTTACCAACACACTAGTGAACAATCACAACACT
+GCTTTGACTATTGAGACAACTTACTTTTTTCCTTTCTCTTTGTTTCTTTCATTTTTCCCC
+CCTTTGGTTGTTATTGGTTAATTTTGATGAATTTCTTTATAGAAGAGTACTCAATAGCTG
+TCAAAAACACTTACCATTTTCCGAGATCTTTCCAATAGCTTATCCCATATTGTAAAATGT
+GCCTTGAAAAGAAAAGATTTGCGATGAACTAAATGAAGCAGTAATGTCAAAGTAAAAAGG
+ACAGAGTCTTTATATAGCTTTTAGAACAAAATAAATAAAAAGCTAGGCAGTACTAATTTA
+GATAAGTGGTTATAAAAGTGGATCATAGTAGCAAAAAAAGGTGCTACATGGGGATAGCTG
+CTTTTTTGCTTTCTTCAATCGCATGAACCCGGGAGGCAGAGGTTGCAGTGAGCATTTAAG
+AAAAAAACGCTTAAGGATTGAACGTGCCCTTCTTTCACTTTTGCCCATCTTAATCATTTC
+CATCATAGAAAGCATTTCTTCTAATAGGAAGCAAAAATCTGCCCTACTTTCCCATAGACT
+GTGGTTCAATCCTTAAACAGCCAGTTTCAACATTCTAGAAGTCATTCTTCAAATCATAAG
+CAATCACAAGAAGACAGTCATTAAAAACCAACTGTGACATCTTCACACTGAAATGGCAGA
+AGCAGAGGATTCATCAAGTTACCCTAAAGAATAAGTAAAACCTAACAAAGACAATAGTAA
+ATTTTTTTTTTTTTTGAAATGGAGTTTCACTCTGTCGCCCAGGCTGGAGTGCAGTGGTGC
+GATCTCAGCTCACTGCAACCTCCGCCTCCCAGGTTCAAGCAATTCTCCTGCCTCAGCCTC
+CCAAGACAATAGTAAAATTTAAACTCAATTTCCTTAGTCCATAACAACCTCCTGTAGCAG
+AGGATTATCAGAATGCATTAAAGAAAACTGTGCAAAGTGTATCATGACCACATCAATTTT
+ATTAGGTCAACTGAAAGTGGTAACAAGACATATGGGCAGGCCAGTGACTACTCCACACTG
+AATGAGCTCATAAAATCTATAATAAAAGGTAAAATTAATAAATATCAACATACAAACCCT
+TCCAGGGAAAGAGCTGACTGGTATGTTTAAAGGGAAAACCATGCCTGACTCAGGCGGAAT
+GAACTGCTGGTGCAGAGACCTTAAGCTGTGGCTGGAATATAGTGAGTGAGGAAAGGAGTG
+GTGTTAGATAAAGTCAGAGAAGCAGGCAGGGACCAGATAATGCAGGGCTTTGTGAGACAG
+GGTAAAGAGTTGGGATTTGTTCAAGGGAAGCCATTGGAAA
diff -r 000000000000 -r 7303183cdb87 test-data/test.gtf
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test.gtf Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,20 @@
+21 havana exon 2770 3326 . - . gene_id "ENSG00000260583"; gene_version "1"; transcript_id "ENST00000567517"; transcript_version "1"; exon_number "1"; gene_name "AP000223.42"; gene_source "havana"; gene_biotype "antisense"; havana_gene "OTTHUMG00000172769"; havana_gene_version "1"; transcript_name "AP000223.42-001"; transcript_source "havana"; transcript_biotype "antisense"; havana_transcript "OTTHUMT00000420390"; havana_transcript_version "1"; exon_id "ENSE00002629631"; exon_version "1"; tag "basic"; transcript_support_level "NA";
+21 havana gene 2770 3326 . - . gene_id "ENSG00000260583"; gene_version "1"; gene_name "AP000223.42"; gene_source "havana"; gene_biotype "antisense"; havana_gene "OTTHUMG00000172769"; havana_gene_version "1";
+21 havana transcript 2770 3326 . - . gene_id "ENSG00000260583"; gene_version "1"; transcript_id "ENST00000567517"; transcript_version "1"; gene_name "AP000223.42"; gene_source "havana"; gene_biotype "antisense"; havana_gene "OTTHUMG00000172769"; havana_gene_version "1"; transcript_name "AP000223.42-001"; transcript_source "havana"; transcript_biotype "antisense"; havana_transcript "OTTHUMT00000420390"; havana_transcript_version "1"; tag "basic"; transcript_support_level "NA";
+21 ensembl_havana three_prime_utr 5656 5706 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana three_prime_utr 5656 5750 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana exon 5656 5754 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "11"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; exon_id "ENSE00003528074"; exon_version "1"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana exon 5656 5754 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; exon_number "10"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; exon_id "ENSE00003605259"; exon_version "1"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana gene 5656 27517 . - . gene_id "ENSG00000154719"; gene_version "13"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4";
+21 ensembl_havana transcript 5656 27517 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana transcript 5656 27517 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana stop_codon 5707 5709 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; exon_number "10"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana CDS 5710 5754 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; exon_number "10"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; protein_id "ENSP00000284967"; protein_version "6"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana stop_codon 5751 5753 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "11"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana CDS 5754 5754 . - 1 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "11"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; protein_id "ENSP00000305682"; protein_version "7"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana CDS 7701 7789 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "10"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; protein_id "ENSP00000305682"; protein_version "7"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana exon 7701 7789 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "10"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; exon_id "ENSE00001149457"; exon_version "5"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana CDS 8835 8882 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "9"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; protein_id "ENSP00000305682"; protein_version "7"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana CDS 8835 8882 . - 0 gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; exon_number "9"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; protein_id "ENSP00000284967"; protein_version "6"; tag "basic"; transcript_support_level "1";
+21 ensembl_havana exon 8835 8882 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000307301"; transcript_version "11"; exon_number "9"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-002"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS33522"; havana_transcript "OTTHUMT00000171195"; havana_transcript_version "2"; exon_id "ENSE00001017286"; exon_version "1"; tag "basic"; transcript_support_level "5";
+21 ensembl_havana exon 8835 8882 . - . gene_id "ENSG00000154719"; gene_version "13"; transcript_id "ENST00000352957"; transcript_version "8"; exon_number "9"; gene_name "MRPL39"; gene_source "ensembl_havana"; gene_biotype "protein_coding"; havana_gene "OTTHUMG00000078371"; havana_gene_version "4"; transcript_name "MRPL39-001"; transcript_source "ensembl_havana"; transcript_biotype "protein_coding"; tag "CCDS"; ccds_id "CCDS13573"; havana_transcript "OTTHUMT00000171194"; havana_transcript_version "1"; exon_id "ENSE00001017286"; exon_version "1"; tag "basic"; transcript_support_level "1";
diff -r 000000000000 -r 7303183cdb87 test-data/vep_versioned_annotation_cache.loc
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vep_versioned_annotation_cache.loc Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,3 @@
+#
+#
+drosophila_melanogaster_vep_106_BDGP6.32 dm6 106 default Drosophila melanogaster dm6 (V106) drosophila_melanogaster ${__HERE__}/test-cache
diff -r 000000000000 -r 7303183cdb87 tool-data/dbkeys.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/dbkeys.loc.sample Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,1 @@
+#
\ No newline at end of file
diff -r 000000000000 -r 7303183cdb87 tool-data/vep_versioned_annotation_cache.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/vep_versioned_annotation_cache.loc.sample Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,11 @@
+#This file describes vep cache data and its metadata available on the server.
+#The data table has the format (white space characters are TAB characters):
+#
+#<value>	<dbkey>	<version>	<cachetype>	<name>	<species>	<path>
+#
+#So, vep_versioned_annotation_cache.loc tables could look like this:
+#
+#homo_sapiens_vep_105_GRCh38 hg38 105 default Homo sapiens hg38 (V105) homo_sapiens /path/to/vep_versioned_annotation_cache/105/hg38/default
+#homo_sapiens_refseq_vep_105_GRCh38 hg38 105 refseq Homo sapiens hg38 (V105, Refseq) homo_sapiens /path/to/vep_versioned_annotation_cache/105/hg38/refseq
+#homo_sapiens_merged_vep_105_GRCh38 hg38 105 merged Homo sapiens hg38 (V105, Merged) homo_sapiens /path/to/vep_versioned_annotation_cache/105/hg38/merged
+#
\ No newline at end of file
diff -r 000000000000 -r 7303183cdb87 tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,12 @@
+
+
+
+ value, dbkey, version, cachetype, name, species, path
+
+
+
+
+ value, name, len_path
+
+
+
\ No newline at end of file
diff -r 000000000000 -r 7303183cdb87 tool_data_table_conf.xml.test
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.test Wed May 11 13:03:38 2022 +0000
@@ -0,0 +1,7 @@
+
+
+
+ value, dbkey, version, cachetype, name, species, path
+
+
+
\ No newline at end of file