Mercurial > repos > proteore > proteore_reactome
view reactome_analysis.py @ 4:878128362e33 draft
planemo upload commit 34edf9c3db61650a03d5a0d548b9697a94ecde34-dirty
author | proteore |
---|---|
date | Tue, 03 Apr 2018 08:24:45 -0400 |
parents | 216bd2a75b1d |
children | 9cc475dcd0f2 |
line wrap: on
line source
import os import re import json import argparse CURRENT_DIR = os.path.dirname(os.path.abspath(__file__)) def id_valid(identifiers): """ Validate IDs if they contain special characters """ res = [] remove = [] for id in identifiers: id = id.split(";")[0] if re.match("^[A-Za-z0-9_-]*$", id): res.append(id) else: remove.append(id) return res, remove def isnumber(format, n): """ Check if an variable is numeric """ float_format = re.compile(r"^[-]?[1-9][0-9]*.?[0-9]+$") int_format = re.compile(r"^[-]?[1-9][0-9]*$") test = "" if format == "int": test = re.match(int_format, n) elif format == "float": test = re.match(float_format, n) if test: return True else: return False def data_json(identifiers): """ Submit IDs list to Reactome and return results in json format Return error in HTML format if web service is not available """ trash = [] if identifiers[1] == "list": ids = "\n".join(id_valid(identifiers[0].split())[0]) #print(ids) #print("curl -H \"Content-Type: text/plain\" -d \"$(printf '%s')\" -X POST --url www.reactome.org/AnalysisService/identifiers/projection/\?pageSize\=1\&page\=1" % ids) json_string = os.popen("curl -H \"Content-Type: text/plain\" -d \"$(printf '%s')\" -X POST --url www.reactome.org/AnalysisService/identifiers/projection/\?pageSize\=1\&page\=1" % ids).read() if len(id_valid(identifiers[0].split())[1]) > 0: trash = id_valid(identifiers[0].split())[1] elif identifiers[1] == "file": header = identifiers[2] mq = open(identifiers[0]).readlines() if isnumber("int", identifiers[3].replace("c", "")): if header == "true": idens = [x.split("\t")[int(identifiers[3].replace("c", ""))-1] for x in mq[1:]] else: idens = [x.split("\t")[int(identifiers[3].replace("c", ""))-1] for x in mq] ids = "\n".join(id_valid(idens)[0]) #print(ids) #print("curl -H \"Content-Type: text/plain\" -d \"$(printf '%s')\" -X POST --url www.reactome.org/AnalysisService/identifiers/projection/\?pageSize\=1\&page\=1" % ids) json_string = os.popen("curl -H \"Content-Type: text/plain\" -d \"$(printf '%s')\" -X POST --url www.reactome.org/AnalysisService/identifiers/projection/\?pageSize\=1\&page\=1" % ids).read() if len(id_valid(idens)[1]) > 0: trash = id_valid(idens)[1] print(json_string) return json_string, trash def write_output(filename, json_string, trash_file, trash): """ Replace json result in template and print to output """ template = open(os.path.join(CURRENT_DIR, "template.html")) output = open(filename, "w") try: for line in template: if "{token}" in line: line = line.replace("{token}", json.loads(json_string)["summary"]["token"]) output.write(line) except ValueError: output.write("An error occurred due to unavailability of Reactome web service. Please return later.") template.close() output.close() if trash: print(trash) trash_out = open(trash_file, "w") trash_out.write("\n".join(trash)) trash_out.close() def options(): parser = argparse.ArgumentParser() argument = parser.add_argument("--json", nargs="+", required=True) argument = parser.add_argument("--output", default="output.html") argument = parser.add_argument("--trash", default="trash.txt") args = parser.parse_args() filename = args.output json_string, trash = data_json(args.json) write_output(filename, json_string, args.trash, trash) if __name__ == "__main__": options()