# HG changeset patch
# User iuc
# Date 1588975357 14400
# Node ID 25811bd45c44099ada40eea7e87dea85a74a785b
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/data_managers/data_manager_vsnp_excel commit 28873701c097a136c789024151e2fb59fa1091cd"
diff -r 000000000000 -r 25811bd45c44 data_manager/vsnp_excel_fetcher.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/vsnp_excel_fetcher.py Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,66 @@
+import argparse
+import json
+import os
+import sys
+try:
+ # For Python 3.0 and later
+ from urllib.request import Request, urlopen
+except ImportError:
+ # Fall back to Python 2 imports
+ from urllib2 import Request, urlopen
+
+
+def url_download(url, workdir):
+ file_path = os.path.abspath(os.path.join(workdir, os.path.basename(url)))
+ src = None
+ dst = None
+ try:
+ req = Request(url)
+ src = urlopen(req)
+ with open(file_path, 'wb') as dst:
+ while True:
+ chunk = src.read(2**10)
+ if chunk:
+ dst.write(chunk)
+ else:
+ break
+ except Exception as e:
+ sys.exit(str(e))
+ finally:
+ if src:
+ src.close()
+ return file_path
+
+
+def download(dbkey, name, url, out_file):
+
+ with open(out_file) as fh:
+ params = json.loads(fh.read())
+
+ workdir = params['output_data'][0]['extra_files_path']
+ os.makedirs(workdir)
+ file_path = url_download(url, workdir)
+ entry_name = os.path.basename(file_path)
+
+ data_manager_json = {"data_tables": {}}
+ data_manager_entry = {}
+ data_manager_entry['value'] = dbkey
+ data_manager_entry['name'] = entry_name
+ data_manager_entry['path'] = file_path
+ data_manager_entry['description'] = "Excel file for %s" % name
+ data_manager_json["data_tables"]["vsnp_excel"] = data_manager_entry
+
+ with open(out_file, 'w') as fh:
+ fh.write(json.dumps(data_manager_json, sort_keys=True))
+
+
+parser = argparse.ArgumentParser()
+
+parser.add_argument('--dbkey', dest='dbkey', help='Genome reference dbkey')
+parser.add_argument('--name', dest='name', help='Reference display name')
+parser.add_argument('--url', dest='url', help='URL to download Excel file')
+parser.add_argument('--out_file', dest='out_file', help='JSON output file')
+
+args = parser.parse_args()
+
+download(args.dbkey, args.name, args.url, args.out_file)
diff -r 000000000000 -r 25811bd45c44 data_manager/vsnp_excel_fetcher.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager/vsnp_excel_fetcher.xml Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,103 @@
+
+
+ Download vSNP Excel files
+
+ python
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff -r 000000000000 -r 25811bd45c44 data_manager_conf.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/data_manager_conf.xml Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,21 @@
+
+
+
+
+
+
+
+
+
diff -r 000000000000 -r 25811bd45c44 test-data/AF2122.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/AF2122.fa Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,11 @@
+>NC_002945.4 Mycobacterium bovis AF2122/97 genome assembly, chromosome: Mycobacterium_bovis_AF2122/97
+TTGACCGATGACCCCGGTTCAGGCTTCACCACAGTGTGGAACGCGGTCGTCTCCGAACTTAACGGCGACC
+CTAAGGTTGACGACGGACCCAGCAGTGATGCTAATCTCAGCGCTCCGCTGACCCCTCAGCAAAGGGCTTG
+GCTCAATCTCGTCCAGCCATTGACCATCGTCGAGGGGTTTGCTCTGTTATCCGTGCCGAGCAGCTTTGTC
+CAAAACGAAATCGAGCGCCATCTGCGGGCCCCGATTACCGACGCTCTCAGCCGCCGACTCGGACATCAGA
+TCCAACTCGGGGTCCGCATCGCTCCGCCGGCGACCGACGAAGCCGACGACACTACCGTGCCGCCTTCCGA
+AAATCCTGCTACCACATCGCCAGACACCACAACCGACAACGACGAGATTGATGACAGCGCTGCGGCACGG
+GGCGATAACCAGCACAGTTGGCCAAGTTACTTCACCGAGCGCCCGCGCAATACCGATTCCGCTACCGCTG
+GCGTAACCAGCCTTAACCGTCGCTACACCTTTGATACGTTCGTTATCGGCGCCTCCAACCGGTTCGCGCA
+CGCCGCCGCCTTGGCGATCGCAGAAGCACCCGCCCGCGCTTACAACCCCCTGTTCATCTGGGGCGAGTCC
+GGTCTCGGCAAGACACACCTGCTACACGCGGCAGGCAACTATGCCCAACGGTTGTTCCCGGGAATGCGGG
diff -r 000000000000 -r 25811bd45c44 test-data/all_fasta.loc
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/all_fasta.loc Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,19 @@
+#This file lists the locations and dbkeys of all the fasta files
+#under the "genome" directory (a directory that contains a directory
+#for each build). The script extract_fasta.py will generate the file
+#all_fasta.loc. This file has the format (white space characters are
+#TAB characters):
+#
+#
+#
+#So, all_fasta.loc could look something like this:
+#
+#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa
+#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa
+#
+#Your all_fasta.loc file should contain an entry for each individual
+#fasta file. So there will be multiple fasta files for each build,
+#such as with hg19 above.
+#
+AF2122 AF2122 AF2122 ${__HERE__}/AF2122.fa
diff -r 000000000000 -r 25811bd45c44 test-data/vsnp_excel.json
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/vsnp_excel.json Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,1 @@
+{"data_tables": {"vsnp_excel": {"description": "Excel file for AF2122", "name": "Mbovis_define_filter.xlsx", "path":
diff -r 000000000000 -r 25811bd45c44 test-data/vsnp_excel.loc
diff -r 000000000000 -r 25811bd45c44 tool-data/all_fasta.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/all_fasta.loc.sample Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,18 @@
+#This file lists the locations and dbkeys of all the fasta files
+#under the "genome" directory (a directory that contains a directory
+#for each build). The script extract_fasta.py will generate the file
+#all_fasta.loc. This file has the format (white space characters are
+#TAB characters):
+#
+#
+#
+#So, all_fasta.loc could look something like this:
+#
+#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa
+#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa
+#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa
+#
+#Your all_fasta.loc file should contain an entry for each individual
+#fasta file. So there will be multiple fasta files for each build,
+#such as with hg19 above.
+#
diff -r 000000000000 -r 25811bd45c44 tool-data/vsnp_excel.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/vsnp_excel.loc.sample Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,4 @@
+## vSNP Excel files
+#Value Name Path Description
+#AF2122 Mbovis_define_filter.xlsx vsnp/AF2122/Mbovis_define_filter.xlsx Excel file for Mycobacterium bovis AF2122/97
+#NC_006932 Bab1_define_filter.xlsx vsnp/NC_006932/Bab1_define_filter.xlsx Excel file for Brucella abortus bv. 1 str. 9-941
diff -r 000000000000 -r 25811bd45c44 tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,13 @@
+
+
+
+ value, dbkey, name, path
+
+
+
+
+ value, name, path, description
+
+
+
+
diff -r 000000000000 -r 25811bd45c44 tool_data_table_conf.xml.test
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.test Fri May 08 18:02:37 2020 -0400
@@ -0,0 +1,12 @@
+
+
+
+ value, dbkey, name, path
+
+
+
+
+ value, name, path, description
+
+
+