Mercurial > repos > galaxyp > ms_data_converter
diff ms_data_converter.py @ 0:dfafbfd7983d
Uploaded
author | galaxyp |
---|---|
date | Wed, 11 Mar 2015 11:36:26 -0400 |
parents | |
children | a36e9f847308 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/ms_data_converter.py Wed Mar 11 11:36:26 2015 -0400 @@ -0,0 +1,157 @@ +#!/usr/bin/env python +import optparse +import os +import sys +import tempfile +import shutil +import subprocess +import re +import logging + +assert sys.version_info[:2] >= (2, 6) + +log = logging.getLogger(__name__) +working_directory = os.getcwd() +tmp_stderr_name = tempfile.NamedTemporaryFile(dir=working_directory, suffix='.stderr').name +tmp_stdout_name = tempfile.NamedTemporaryFile(dir=working_directory, suffix='.stdout').name + + +def stop_err(msg): + sys.stderr.write("%s\n" % msg) + sys.exit() + + +def read_stderr(): + stderr = '' + if(os.path.exists(tmp_stderr_name)): + with open(tmp_stderr_name, 'rb') as tmp_stderr: + buffsize = 1048576 + try: + while True: + stderr += tmp_stderr.read(buffsize) + if not stderr or len(stderr) % buffsize != 0: + break + except OverflowError: + pass + return stderr + + +def execute(command, stdin=None): + try: + with open(tmp_stderr_name, 'wb') as tmp_stderr: + with open(tmp_stdout_name, 'wb') as tmp_stdout: + proc = subprocess.Popen(args=command, shell=True, stderr=tmp_stderr.fileno(), stdout=tmp_stdout.fileno(), stdin=stdin, env=os.environ) + returncode = proc.wait() + if returncode != 0: + raise Exception("Program returned with non-zero exit code %d. stderr: %s" % (returncode, read_stderr())) + finally: + print(( open(tmp_stderr_name, "r").read() )) + print(( open(tmp_stdout_name, "r").read() )) + + +def delete_file(path): + if os.path.exists(path): + try: + os.remove(path) + except: + pass + + +def delete_directory(directory): + if os.path.exists(directory): + try: + shutil.rmtree(directory) + except: + pass + + +def symlink(source, link_name): + import platform + if platform.system() == 'Windows': + try: + import win32file + win32file.CreateSymbolicLink(source, link_name, 1) + except: + shutil.copy(source, link_name) + else: + os.symlink(source, link_name) + + +def copy_to_working_directory(data_file, relative_path): + if os.path.abspath(data_file) != os.path.abspath(relative_path): + symlink(data_file, relative_path) + return relative_path + + +def __main__(): + run_script() + +#ENDTEMPLATE + +def str_to_bool(v): + """ From http://stackoverflow.com/questions/715417/converting-from-a-string-to-boolean-in-python """ + return v.lower() in ["yes", "true", "t", "1"] + +def shellquote(s): + return '"' + s.replace('"', '\\"') + '"' + +def run_script(): + parser = optparse.OptionParser() + parser.add_option('--input', dest='inputs', action='append', default=[]) + parser.add_option('--input_name', dest='input_names', action='append', default=[]) + parser.add_option('--implicit', dest='implicits', action='append', default=[], help='input files that should NOT be on the AB SCIEX MS Data Converter command line.') + parser.add_option('--output', dest='output') + parser.add_option('--fromextension', dest='fromextension') + parser.add_option('--toextension', dest='toextension', default='mzML', choices=['mzML', 'mgf']) + parser.add_option('--content_type', dest='content_type', default='centroid', choices=['profile', 'centroid', 'proteinpilot']) + parser.add_option('--binaryencoding', dest='binaryencoding', choices=['32', '64']) + parser.add_option('--zlib', dest='zlib', default="false") + parser.add_option('--index', dest='index', default="false") + parser.add_option('--debug', dest='debug', action='store_true', default=False) + + (options, args) = parser.parse_args() + if len(options.inputs) < 1: + stop_err("No input files to ms_data_convert specified") + if len(options.input_names) > 0 and len(options.input_names) != len(options.inputs): + stop_err("Number(s) of supplied input names and input files do not match") + if not options.output: + stop_err("Must specify output location") + input_files = [] + for i, input in enumerate(options.inputs): + input_base = None + if len(options.input_names) > i: + input_base = options.input_names[i] + input_base = input_base.replace("'", "").replace("\"", "") + print("1- input_base: %s" % input_base) + if not input_base: + input_base = 'input%s' % i + print("2- input_base: %s" % input_base) + if not input_base.lower().endswith(options.fromextension.lower()) and input not in options.implicits: + input_file = '%s.%s' % (input_base, options.fromextension) + print("3- input_base: %s" % input_base) + print("3- input_file: %s" % input_file) + else: + input_file = input_base + print("4- input_base: %s" % input_base) + print("4- input_file: %s" % input_file) + input_file = input_file + copy_to_working_directory(input, input_file) + if input not in options.implicits: + input_files.append(input_file) + ## AB_SCIEX_MS_Converter <input format> <input data> <output content type> <output format> <output file> [data compression setting] [data precision setting] [create index flag] + inputs_as_str = " ".join(['%s' % shellquote(input) for input in input_files]) + output_file = re.sub('(%s)?$' % options.fromextension.lower(), options.toextension, input_files[0].lower()) + cmd = "AB_SCIEX_MS_Converter %s %s %s %s %s" % (options.fromextension.upper(), inputs_as_str, options.content_type, options.toextension.upper(), output_file ) + if str_to_bool(options.zlib): + cmd = "%s %s" % (cmd, "/zlib") + if options.binaryencoding: + cmd = "%s %s" % (cmd, "/singleprecision" if options.binaryencoding == '32' else "/doubleprecision") + if str_to_bool(options.zlib): + cmd = "%s %s" % (cmd, "/index") + if options.debug: + print(cmd) + execute(cmd) + shutil.copy(output_file, options.output) + +if __name__ == '__main__': + __main__()