tool_factory_2: rgToolFactory2.py comparison

comparison rgToolFactory2.py @ 15:dd6cf2ddaac7 draft

Uploaded

author	fubar
date	Wed, 28 Jan 2015 19:28:32 -0500
parents	3635f4518c4d
children

comparison

equal deleted inserted replaced

-:3635f4518c4d
+:dd6cf2ddaac7
 # all rights reserved
 # Licensed under the LGPL
 # suggestions for improvement and bug fixes welcome at https://bitbucket.org/fubar/galaxytoolfactory/wiki/Home
 #
 # January 2015
+# unified all setups by passing the script on the cl rather than via a PIPE - no need for treat_bash_special so removed
+#
 # in the process of building a complex tool
 # added ability to choose one of the current toolshed package_r or package_perl or package_python dependencies and source that package
 # add that package to tool_dependencies
 # Note that once the generated tool is loaded, it will have that package's env.sh loaded automagically so there is no
 # --envshpath in the parameters for the generated tool and it uses the system one which will be first on the adjusted path.
 def timenow():
 """return current time as a string
 """
 return time.strftime('%d/%m/%Y %H:%M:%S', time.localtime(time.time()))
+def quote_non_numeric(s):
+"""return a prequoted string for non-numerics
+useful for perl and Rscript parameter passing?
+"""
+try:
+res = float(s)
+return s
+except ValueError:
+return '"%s"' % s
 html_escape_table = {
 "&": "&amp;",
 ">": "&gt;",
 "<": "&lt;",
 "$": "\$"
 else:
 citation_tuples.append( ("bibtex", citation[len("bibtex"):].strip() ) )
 return citation_tuples
 def shell_source(script):
-"""need a way to source a Galaxy tool interpreter env.sh so we can use that dependency
+"""need a way to source a Galaxy tool interpreter env.sh to point at the right dependency package
-package
+This based on the idea in http://pythonwise.blogspot.fr/2010/04/sourcing-shell-script.html
-see http://pythonwise.blogspot.fr/2010/04/sourcing-shell-script.html
+Note that we have to finesse any wierdly quoted newlines in automagic exports using nulls (env -0) as newlines"""
-Sometime you want to emulate the action of "source" in bash,
-settings some environment variables. Here is a way to do it.
-Note that we have to finesse the automagic exports using nulls as newlines for env"""
 pipe = subprocess.Popen("env -i ; . %s ; env -0" % script, stdout=subprocess.PIPE, shell=True)
 output = pipe.communicate()[0]
 outl = output.split('\0')
 outl = [x for x in outl if len(x.split("=")) == 2]
 newenv = dict((line.split("=", 1) for line in outl))
 little overhead...
 """
-def __init__(self,opts=None,treatbashSpecial=True):
+def __init__(self,opts=None):
 """
 cleanup inputs, setup some outputs
 """
 self.useGM = cmd_exists('gm')
 self.useIM = cmd_exists('convert')
 self.useGS = cmd_exists('gs')
 self.temp_warned = False # we want only one warning if $TMP not set
-self.treatbashSpecial = treatbashSpecial
 if opts.output_dir: # simplify for the tool tarball
 os.chdir(opts.output_dir)
 self.thumbformat = 'png'
 self.opts = opts
 self.toolname = re.sub('[^a-zA-Z0-9_]+', '', opts.tool_name) # a sanitizer now does this but..
 psplit = p.split(',')
 param = html_unescape(psplit[0])
 value = html_unescape(psplit[1])
 a('%s="%s"' % (param,value))
 if (self.opts.interpreter == 'Rscript'):
-# pass params on command line
+# pass params on command line as expressions which the script evaluates - see sample
 if self.opts.input_tab:
 a('INPATHS="%s"' % self.infile_paths)
 a('INNAMES="%s"' % self.infile_names)
 if self.opts.output_tab:
 a('OUTPATH="%s"' % self.opts.output_tab)
 for p in opts.additional_parameters:
 p = p.replace('"','')
 psplit = p.split(',')
 param = html_unescape(psplit[0])
 value = html_unescape(psplit[1])
-a('%s="%s"' % (param,value))
+a('%s=%s' % (param,quote_non_numeric(value)))
 if (self.opts.interpreter == 'perl'):
-# pass params on command line
+# pass positional params on command line - perl script needs to discombobulate the path/name lists
 if self.opts.input_tab:
 a('%s' % self.infile_paths)
 a('%s' % self.infile_names)
 if self.opts.output_tab:
 a('%s' % self.opts.output_tab)
 for p in opts.additional_parameters:
+# followed by any additional name=value parameter pairs
 p = p.replace('"','')
 psplit = p.split(',')
 param = html_unescape(psplit[0])
 value = html_unescape(psplit[1])
-if (value.find(' ') <> -1):
+a('%s=%s' % (param,quote_non_numeric(value)))
-a('%s="%s"' % (param,value))
-else:
-a('%s=%s' % (param,value))
 if self.opts.interpreter == 'sh' or self.opts.interpreter == 'bash':
 # more is better - now move all params into environment AND drop on to command line.
 self.cl.insert(0,'env')
 if self.opts.input_tab:
 self.cl.insert(1,'INPATHS=%s' % (self.infile_paths))
 # additional params appear in CL - yes, it's confusing
 for i,p in enumerate(opts.additional_parameters):
 psplit = p.split(',')
 param = html_unescape(psplit[0])
 value = html_unescape(psplit[1])
-if (value.find(' ') <> -1):
+a('%s=%s' % (param,quote_non_numeric(value)))
-a('%s="%s"' % (param,value))
+self.cl.insert(4+i,'%s=%s' % (param,quote_non_numeric(value)))
-self.cl.insert(4+i,'%s="%s"' % (param,value))
+self.interpreter_owner = 'SYSTEM'
-else:
+self.interpreter_pack = 'SYSTEM'
-a('%s=%s' % (param,value))
+self.interpreter_name = 'SYSTEM'
-self.cl.insert(4+i,'%s=%s' % (param,value))
+self.interpreter_version = 'SYSTEM'
-self.interp_owner = None
+self.interpreter_revision = 'SYSTEM'
-self.interp_pack = None
-self.interp_revision = None
-self.interp_version = None
 if opts.envshpath <> 'system': # need to parse out details for our tool_dependency
 try: # fragile - depends on common naming convention as at jan 2015 = package_[interp]_v0_v1_v2... = version v0.v1.v2.. is in play
+# this ONLY happens at tool generation by an admin - the generated tool always uses the default of system so path is from local env.sh
 packdetails = opts.envshpath.split(os.path.sep)[-4:-1]  # eg ['fubar', 'package_r_3_1_1', '63cdb9b2234c']
 self.interpreter_owner = packdetails[0]
 self.interpreter_pack = packdetails[1]
 self.interpreter_name = packdetails[1].split('_')[1].upper()
 self.interpreter_revision = packdetails[2]
 if self.opts.envshpath == 'system':
 tooldepcontent = self.toolhtmldepskel % readme_dict
 else:
 tooldepcontent = self.toolhtmldepinterpskel % readme_dict
 else:
-tooldepcontent = self.emptytoolhtmldepskel  % readme_dictls -l
+tooldepcontent = self.emptytoolhtmldepskel  % readme_dict
 depf = open(os.path.join(tdir,'tool_dependencies.xml'),'w')
 depf.write(tooldepcontent)
 depf.write('\n')
 depf.close()
 testdir = os.path.join(tdir,'test-data')
 def run(self):
 """
-scripts must be small enough not to fill the pipe!
+Some devteam tools have this defensive stderr read so I'm keeping with the faith
+Feel free to update.
 """
 if self.opts.envshpath <> 'system':
 shell_source(self.opts.envshpath)
-if self.treatbashSpecial and self.opts.interpreter in ['bash','sh']:
+# this only happens at tool generation - the generated tool relies on the dependencies all being set up
-retval = self.runBash()
+# at toolshed installation by sourcing local env.sh
-else:
+if self.opts.output_dir:
-if self.opts.output_dir:
+ste = open(self.elog,'wb')
-ste = open(self.elog,'w')
+sto = open(self.tlog,'wb')
-sto = open(self.tlog,'w')
+s = ' '.join(self.cl)
-sto.write('## Toolfactory generated command line = %s\n' % ' '.join(self.cl))
+sto.write('## Executing Toolfactory generated command line = %s\n' % s)
 sto.flush()
 p = subprocess.Popen(self.cl,shell=False,stdout=sto,stderr=ste,cwd=self.opts.output_dir)
-else:
-p = subprocess.Popen(self.cl,shell=False)
 retval = p.wait()
-if self.opts.output_dir:
+sto.close()
-sto.close()
+ste.close()
-ste.close()
+tmp_stderr = open( self.elog, 'rb' )
-err = open(self.elog,'r').readlines()
+err = ''
-if retval <> 0 and err: # problem
+buffsize = 1048576
-print >> sys.stderr,err
+try:
-if self.opts.make_HTML:
+while True:
-self.makeHtml()
+err += tmp_stderr.read( buffsize )
-return retval
+if not err or len( stderr ) % buffsize != 0:
+break
-def runBash(self):
+except OverflowError:
-"""
+pass
-cannot use - for bash so use self.sfile
+tmp_stderr.close()
-"""
+else:
+p = subprocess.Popen(self.cl,shell=False)
+retval = p.wait()
 if self.opts.output_dir:
-s = '## Toolfactory generated command line = %s\n' % ' '.join(self.cl)
+if retval <> 0 and err: # problem
-sto = open(self.tlog,'w')
+print >> sys.stderr,err
-sto.write(s)
-sto.flush()
-p = subprocess.Popen(self.cl,shell=False,stdout=sto,stderr=sto,cwd=self.opts.output_dir)
-else:
-p = subprocess.Popen(self.cl,shell=False)
-retval = p.wait()
-if self.opts.output_dir:
-sto.close()
 if self.opts.make_HTML:
 self.makeHtml()
 return retval
 def main():
 u = """
 This is a Galaxy wrapper. It expects to be called by a special purpose tool.xml as:

Mercurial > repos > fubar > tool_factory_2

comparison rgToolFactory2.py @ 15:dd6cf2ddaac7 draft