Mercurial > repos > iuc > data_manager_mothur_toolsuite
comparison data_manager/fetch_mothur_reference_data.py @ 1:aec831b54a5b draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/data_managers/data_manager_mothur_toolsuite/ commit 57f71aa633a43ab02bbf05acd0c6d7f406e01f1e"
| author | iuc |
|---|---|
| date | Thu, 28 Nov 2019 15:47:32 -0500 |
| parents | ab7a7e798c34 |
| children | 0e532fc0a0a6 |
comparison legend: equal | deleted | inserted | replaced
| 0:ab7a7e798c34 | 1:aec831b54a5b |
|---|---|
| 226 system. | 226 system. |
| 227 | 227 |
| 228 Returns the name that the file is saved with. | 228 Returns the name that the file is saved with. |
| 229 | 229 |
| 230 """ | 230 """ |
| 231 print "Downloading %s" % url | 231 print("Downloading %s" % url) |
| 232 if not target: | 232 if not target: |
| 233 target = os.path.basename(url) | 233 target = os.path.basename(url) |
| 234 if wd: | 234 if wd: |
| 235 target = os.path.join(wd, target) | 235 target = os.path.join(wd, target) |
| 236 print "Saving to %s" % target | 236 print("Saving to %s" % target) |
| 237 open(target, 'wb').write(urllib2.urlopen(url).read()) | 237 open(target, 'wb').write(urllib2.urlopen(url).read()) |
| 238 return target | 238 return target |
| 239 | 239 |
| 240 | 240 |
| 241 def unpack_zip_archive(filen, wd=None): | 241 def unpack_zip_archive(filen, wd=None): |
| 252 Once all the files are extracted the ZIP archive | 252 Once all the files are extracted the ZIP archive |
| 253 file is deleted from the file system. | 253 file is deleted from the file system. |
| 254 | 254 |
| 255 """ | 255 """ |
| 256 if not zipfile.is_zipfile(filen): | 256 if not zipfile.is_zipfile(filen): |
| 257 print "%s: not ZIP formatted file" | 257 print("%s: not ZIP formatted file") |
| 258 return [filen] | 258 return [filen] |
| 259 file_list = [] | 259 file_list = [] |
| 260 z = zipfile.ZipFile(filen) | 260 z = zipfile.ZipFile(filen) |
| 261 for name in z.namelist(): | 261 for name in z.namelist(): |
| 262 if reduce(lambda x, y: x or name.startswith(y), IGNORE_PATHS, False): | 262 if reduce(lambda x, y: x or name.startswith(y), IGNORE_PATHS, False): |
| 263 print "Ignoring %s" % name | 263 print("Ignoring %s" % name) |
| 264 continue | 264 continue |
| 265 if wd: | 265 if wd: |
| 266 target = os.path.join(wd, name) | 266 target = os.path.join(wd, name) |
| 267 else: | 267 else: |
| 268 target = name | 268 target = name |
| 269 if name.endswith('/'): | 269 if name.endswith('/'): |
| 270 # Make directory | 270 # Make directory |
| 271 print "Creating dir %s" % target | 271 print("Creating dir %s" % target) |
| 272 try: | 272 try: |
| 273 os.makedirs(target) | 273 os.makedirs(target) |
| 274 except OSError: | 274 except OSError: |
| 275 pass | 275 pass |
| 276 else: | 276 else: |
| 277 # Extract file | 277 # Extract file |
| 278 print "Extracting %s" % name | 278 print("Extracting %s" % name) |
| 279 try: | 279 try: |
| 280 os.makedirs(os.path.dirname(target)) | 280 os.makedirs(os.path.dirname(target)) |
| 281 except OSError: | 281 except OSError: |
| 282 pass | 282 pass |
| 283 open(target, 'wb').write(z.read(name)) | 283 open(target, 'wb').write(z.read(name)) |
| 284 file_list.append(target) | 284 file_list.append(target) |
| 285 print "Removing %s" % filen | 285 print("Removing %s" % filen) |
| 286 os.remove(filen) | 286 os.remove(filen) |
| 287 return file_list | 287 return file_list |
| 288 | 288 |
| 289 | 289 |
| 290 def unpack_tar_archive(filen, wd=None): | 290 def unpack_tar_archive(filen, wd=None): |
| 303 file is deleted from the file system. | 303 file is deleted from the file system. |
| 304 | 304 |
| 305 """ | 305 """ |
| 306 file_list = [] | 306 file_list = [] |
| 307 if not tarfile.is_tarfile(filen): | 307 if not tarfile.is_tarfile(filen): |
| 308 print "%s: not TAR file" | 308 print("%s: not TAR file") |
| 309 return [filen] | 309 return [filen] |
| 310 t = tarfile.open(filen) | 310 t = tarfile.open(filen) |
| 311 for name in t.getnames(): | 311 for name in t.getnames(): |
| 312 # Check for unwanted files | 312 # Check for unwanted files |
| 313 if reduce(lambda x, y: x or name.startswith(y), IGNORE_PATHS, False): | 313 if reduce(lambda x, y: x or name.startswith(y), IGNORE_PATHS, False): |
| 314 print "Ignoring %s" % name | 314 print("Ignoring %s" % name) |
| 315 continue | 315 continue |
| 316 # Extract file | 316 # Extract file |
| 317 print "Extracting %s" % name | 317 print("Extracting %s" % name) |
| 318 t.extract(name, wd) | 318 t.extract(name, wd) |
| 319 if wd: | 319 if wd: |
| 320 target = os.path.join(wd, name) | 320 target = os.path.join(wd, name) |
| 321 else: | 321 else: |
| 322 target = name | 322 target = name |
| 323 file_list.append(target) | 323 file_list.append(target) |
| 324 print "Removing %s" % filen | 324 print("Removing %s" % filen) |
| 325 os.remove(filen) | 325 os.remove(filen) |
| 326 return file_list | 326 return file_list |
| 327 | 327 |
| 328 | 328 |
| 329 def unpack_archive(filen, wd=None): | 329 def unpack_archive(filen, wd=None): |
| 337 'wd' specifies the working directory to extract | 337 'wd' specifies the working directory to extract |
| 338 the files to, otherwise they are extracted to the | 338 the files to, otherwise they are extracted to the |
| 339 current working directory. | 339 current working directory. |
| 340 | 340 |
| 341 """ | 341 """ |
| 342 print "Unpack %s" % filen | 342 print("Unpack %s" % filen) |
| 343 ext = os.path.splitext(filen)[1] | 343 ext = os.path.splitext(filen)[1] |
| 344 print "Extension: %s" % ext | 344 print("Extension: %s" % ext) |
| 345 if ext == ".zip": | 345 if ext == ".zip": |
| 346 return unpack_zip_archive(filen, wd=wd) | 346 return unpack_zip_archive(filen, wd=wd) |
| 347 elif ext == ".tgz": | 347 elif ext == ".tgz": |
| 348 return unpack_tar_archive(filen, wd=wd) | 348 return unpack_tar_archive(filen, wd=wd) |
| 349 else: | 349 else: |
| 380 """ | 380 """ |
| 381 ext = os.path.splitext(filen)[1] | 381 ext = os.path.splitext(filen)[1] |
| 382 try: | 382 try: |
| 383 return MOTHUR_FILE_TYPES[ext] | 383 return MOTHUR_FILE_TYPES[ext] |
| 384 except KeyError: | 384 except KeyError: |
| 385 print "WARNING: unknown file type for " + filen + ", skipping" | 385 print("WARNING: unknown file type for " + filen + ", skipping") |
| 386 return None | 386 return None |
| 387 | 387 |
| 388 | 388 |
| 389 def get_name(filen): | 389 def get_name(filen): |
| 390 """Generate a descriptive name based on the file name | 390 """Generate a descriptive name based on the file name |
| 413 datasets: a list of dataset names corresponding to keys in | 413 datasets: a list of dataset names corresponding to keys in |
| 414 the MOTHUR_REFERENCE_DATA dictionary | 414 the MOTHUR_REFERENCE_DATA dictionary |
| 415 """ | 415 """ |
| 416 # Make working dir | 416 # Make working dir |
| 417 wd = tempfile.mkdtemp(suffix=".mothur", dir=os.getcwd()) | 417 wd = tempfile.mkdtemp(suffix=".mothur", dir=os.getcwd()) |
| 418 print "Working dir %s" % wd | 418 print("Working dir %s" % wd) |
| 419 # Iterate over all requested reference data URLs | 419 # Iterate over all requested reference data URLs |
| 420 for dataset in datasets: | 420 for dataset in datasets: |
| 421 print "Handling dataset '%s'" % dataset | 421 print("Handling dataset '%s'" % dataset) |
| 422 for name in MOTHUR_REFERENCE_DATA[dataset]: | 422 for name in MOTHUR_REFERENCE_DATA[dataset]: |
| 423 for f in fetch_files(MOTHUR_REFERENCE_DATA[dataset][name], wd=wd): | 423 for f in fetch_files(MOTHUR_REFERENCE_DATA[dataset][name], wd=wd): |
| 424 type_ = identify_type(f) | 424 type_ = identify_type(f) |
| 425 entry_name = "%s (%s)" % (os.path.splitext(os.path.basename(f))[0], name) | 425 entry_name = "%s (%s)" % (os.path.splitext(os.path.basename(f))[0], name) |
| 426 print "%s\t\'%s'\t.../%s" % (type_, entry_name, os.path.basename(f)) | 426 print("%s\t\'%s'\t.../%s" % (type_, entry_name, os.path.basename(f))) |
| 427 if type_ is not None: | 427 if type_ is not None: |
| 428 # Move to target dir | 428 # Move to target dir |
| 429 ref_data_file = os.path.basename(f) | 429 ref_data_file = os.path.basename(f) |
| 430 f1 = os.path.join(target_dir, ref_data_file) | 430 f1 = os.path.join(target_dir, ref_data_file) |
| 431 print "Moving %s to %s" % (f, f1) | 431 print("Moving %s to %s" % (f, f1)) |
| 432 os.rename(f, f1) | 432 os.rename(f, f1) |
| 433 # Add entry to data table | 433 # Add entry to data table |
| 434 table_name = "mothur_%s" % type_ | 434 table_name = "mothur_%s" % type_ |
| 435 add_data_table_entry(data_tables, table_name, dict(name=entry_name, value=ref_data_file)) | 435 add_data_table_entry(data_tables, table_name, dict(name=entry_name, value=ref_data_file)) |
| 436 # Remove working dir | 436 # Remove working dir |
| 437 print "Removing %s" % wd | 437 print("Removing %s" % wd) |
| 438 shutil.rmtree(wd) | 438 shutil.rmtree(wd) |
| 439 | 439 |
| 440 | 440 |
| 441 def files_from_filesystem_paths(paths): | 441 def files_from_filesystem_paths(paths): |
| 442 """Return list of file paths from arbitrary input paths | 442 """Return list of file paths from arbitrary input paths |
| 448 """ | 448 """ |
| 449 # Collect files to add | 449 # Collect files to add |
| 450 files = [] | 450 files = [] |
| 451 for path in paths: | 451 for path in paths: |
| 452 path = os.path.abspath(path) | 452 path = os.path.abspath(path) |
| 453 print "Examining '%s'..." % path | 453 print("Examining '%s'..." % path) |
| 454 if os.path.isfile(path): | 454 if os.path.isfile(path): |
| 455 # Store full path for file | 455 # Store full path for file |
| 456 files.append(path) | 456 files.append(path) |
| 457 elif os.path.isdir(path): | 457 elif os.path.isdir(path): |
| 458 # Descend into directory and collect the files | 458 # Descend into directory and collect the files |
| 459 for f in os.listdir(path): | 459 for f in os.listdir(path): |
| 460 files.extend(files_from_filesystem_paths((os.path.join(path, f), ))) | 460 files.extend(files_from_filesystem_paths((os.path.join(path, f), ))) |
| 461 else: | 461 else: |
| 462 print "Not a file or directory, ignored" | 462 print("Not a file or directory, ignored") |
| 463 return files | 463 return files |
| 464 | 464 |
| 465 | 465 |
| 466 def import_from_server(data_tables, target_dir, paths, description, link_to_data=False): | 466 def import_from_server(data_tables, target_dir, paths, description, link_to_data=False): |
| 467 """Import reference data from filesystem paths | 467 """Import reference data from filesystem paths |
| 487 files = files_from_filesystem_paths(paths) | 487 files = files_from_filesystem_paths(paths) |
| 488 # Handle each file individually | 488 # Handle each file individually |
| 489 for f in files: | 489 for f in files: |
| 490 type_ = identify_type(f) | 490 type_ = identify_type(f) |
| 491 if type_ is None: | 491 if type_ is None: |
| 492 print "%s: unrecognised type, skipped" % f | 492 print("%s: unrecognised type, skipped" % f) |
| 493 continue | 493 continue |
| 494 ref_data_file = os.path.basename(f) | 494 ref_data_file = os.path.basename(f) |
| 495 target_file = os.path.join(target_dir, ref_data_file) | 495 target_file = os.path.join(target_dir, ref_data_file) |
| 496 entry_name = "%s" % os.path.splitext(ref_data_file)[0] | 496 entry_name = "%s" % os.path.splitext(ref_data_file)[0] |
| 497 if description: | 497 if description: |
| 498 entry_name += " (%s)" % description | 498 entry_name += " (%s)" % description |
| 499 print "%s\t\'%s'\t.../%s" % (type_, entry_name, ref_data_file) | 499 print("%s\t\'%s'\t.../%s" % (type_, entry_name, ref_data_file)) |
| 500 # Link to or copy the data | 500 # Link to or copy the data |
| 501 if link_to_data: | 501 if link_to_data: |
| 502 os.symlink(f, target_file) | 502 os.symlink(f, target_file) |
| 503 else: | 503 else: |
| 504 shutil.copyfile(f, target_file) | 504 shutil.copyfile(f, target_file) |
| 506 table_name = "mothur_%s" % type_ | 506 table_name = "mothur_%s" % type_ |
| 507 add_data_table_entry(data_tables, table_name, dict(name=entry_name, value=ref_data_file)) | 507 add_data_table_entry(data_tables, table_name, dict(name=entry_name, value=ref_data_file)) |
| 508 | 508 |
| 509 | 509 |
| 510 if __name__ == "__main__": | 510 if __name__ == "__main__": |
| 511 print "Starting..." | 511 print("Starting...") |
| 512 | 512 |
| 513 # Read command line | 513 # Read command line |
| 514 parser = optparse.OptionParser() | 514 parser = optparse.OptionParser() |
| 515 parser.add_option('--source', action='store', dest='data_source') | 515 parser.add_option('--source', action='store', dest='data_source') |
| 516 parser.add_option('--datasets', action='store', dest='datasets', default='') | 516 parser.add_option('--datasets', action='store', dest='datasets', default='') |
| 517 parser.add_option('--paths', action='store', dest='paths', default=[]) | 517 parser.add_option('--paths', action='store', dest='paths', default=[]) |
| 518 parser.add_option('--description', action='store', dest='description', default='') | 518 parser.add_option('--description', action='store', dest='description', default='') |
| 519 parser.add_option('--link', action='store_true', dest='link_to_data') | 519 parser.add_option('--link', action='store_true', dest='link_to_data') |
| 520 options, args = parser.parse_args() | 520 options, args = parser.parse_args() |
| 521 print "options: %s" % options | 521 print("options: %s" % options) |
| 522 print "args : %s" % args | 522 print("args : %s" % args) |
| 523 | 523 |
| 524 # Check for JSON file | 524 # Check for JSON file |
| 525 if len(args) != 1: | 525 if len(args) != 1: |
| 526 sys.stderr.write("Need to supply JSON file name") | 526 sys.stderr.write("Need to supply JSON file name") |
| 527 sys.exit(1) | 527 sys.exit(1) |
| 530 | 530 |
| 531 # Read the input JSON | 531 # Read the input JSON |
| 532 params, target_dir = read_input_json(jsonfile) | 532 params, target_dir = read_input_json(jsonfile) |
| 533 | 533 |
| 534 # Make the target directory | 534 # Make the target directory |
| 535 print "Making %s" % target_dir | 535 print("Making %s" % target_dir) |
| 536 os.mkdir(target_dir) | 536 os.mkdir(target_dir) |
| 537 | 537 |
| 538 # Set up data tables dictionary | 538 # Set up data tables dictionary |
| 539 data_tables = create_data_tables_dict() | 539 data_tables = create_data_tables_dict() |
| 540 add_data_table(data_tables, 'mothur_lookup') | 540 add_data_table(data_tables, 'mothur_lookup') |
| 552 # Get list of paths (need to remove any escapes for '\n' and '\r' | 552 # Get list of paths (need to remove any escapes for '\n' and '\r' |
| 553 # that might have been inserted by Galaxy) | 553 # that might have been inserted by Galaxy) |
| 554 paths = options.paths.replace('__cn__', '\n').replace('__cr__', '\r').split() | 554 paths = options.paths.replace('__cn__', '\n').replace('__cr__', '\r').split() |
| 555 import_from_server(data_tables, target_dir, paths, description, link_to_data=options.link_to_data) | 555 import_from_server(data_tables, target_dir, paths, description, link_to_data=options.link_to_data) |
| 556 # Write output JSON | 556 # Write output JSON |
| 557 print "Outputting JSON" | 557 print("Outputting JSON") |
| 558 print str(json.dumps(data_tables)) | 558 print(json.dumps(data_tables)) |
| 559 open(jsonfile, 'wb').write(json.dumps(data_tables)) | 559 open(jsonfile, 'w').write(json.dumps(data_tables, sort_keys=True)) |
| 560 print "Done." | 560 print("Done.") |
