annotate Marea/marea.py @ 47:3af9d394367c draft

Uploaded
author bimib
date Wed, 19 Feb 2020 10:44:52 -0500
parents 7b1971251c63
children e4235b5231e4
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
1 from __future__ import division
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
2 import sys
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
3 import pandas as pd
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
4 import itertools as it
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
5 import scipy.stats as st
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
6 import collections
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
7 import lxml.etree as ET
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
8 import pickle as pk
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
9 import math
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
10 import os
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
11 import argparse
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
12 from svglib.svglib import svg2rlg
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
13 from reportlab.graphics import renderPDF
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
14
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
15 ########################## argparse ##########################################
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
16
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
17 def process_args(args):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
18 parser = argparse.ArgumentParser(usage = '%(prog)s [options]',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
19 description = 'process some value\'s'+
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
20 ' genes to create a comparison\'s map.')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
21 parser.add_argument('-rs', '--rules_selector',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
22 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
23 default = 'HMRcore',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
24 choices = ['HMRcore', 'Recon', 'Custom'],
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
25 help = 'chose which type of dataset you want use')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
26 parser.add_argument('-cr', '--custom',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
27 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
28 help='your dataset if you want custom rules')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
29 parser.add_argument('-n', '--none',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
30 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
31 default = 'true',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
32 choices = ['true', 'false'],
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
33 help = 'compute Nan values')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
34 parser.add_argument('-pv' ,'--pValue',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
35 type = float,
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
36 default = 0.1,
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
37 help = 'P-Value threshold (default: %(default)s)')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
38 parser.add_argument('-fc', '--fChange',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
39 type = float,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
40 default = 1.5,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
41 help = 'Fold-Change threshold (default: %(default)s)')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
42 parser.add_argument('-td', '--tool_dir',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
43 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
44 required = True,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
45 help = 'your tool directory')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
46 parser.add_argument('-op', '--option',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
47 type = str,
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
48 choices = ['datasets', 'dataset_class'],
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
49 help='dataset or dataset and class')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
50 parser.add_argument('-ol', '--out_log',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
51 help = "Output log")
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
52 parser.add_argument('-id', '--input_data',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
53 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
54 help = 'input dataset')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
55 parser.add_argument('-ic', '--input_class',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
56 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
57 help = 'sample group specification')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
58 parser.add_argument('-cm', '--custom_map',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
59 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
60 help = 'custom map')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
61 parser.add_argument('-yn', '--yes_no',
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
62 type = str,
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
63 choices = ['yes', 'no'],
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
64 help = 'if make or not custom map')
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
65 parser.add_argument('-gs', '--generate_svg',
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
66 type = str,
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
67 default = 'true',
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
68 choices = ['true', 'false'],
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
69 help = 'generate svg map')
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
70 parser.add_argument('-gp', '--generate_pdf',
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
71 type = str,
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
72 default = 'true',
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
73 choices = ['true', 'false'],
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
74 help = 'generate pdf map')
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
75 parser.add_argument('-on', '--control',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
76 type = str)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
77 parser.add_argument('-co', '--comparison',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
78 type = str,
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
79 default = '1vs1',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
80 choices = ['manyvsmany', 'onevsrest', 'onevsmany'])
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
81 parser.add_argument('-ids', '--input_datas',
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
82 type = str,
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
83 nargs = '+',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
84 help = 'input datasets')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
85 parser.add_argument('-na', '--names',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
86 type = str,
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
87 nargs = '+',
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
88 help = 'input names')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
89
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
90 args = parser.parse_args()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
91 return args
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
92
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
93 ########################### warning ###########################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
94
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
95 def warning(s):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
96 args = process_args(sys.argv)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
97 with open(args.out_log, 'a') as log:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
98 log.write(s)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
99
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
100 ############################ dataset input ####################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
101
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
102 def read_dataset(data, name):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
103 try:
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
104 dataset = pd.read_csv(data, sep = '\t', header = 0, engine='python')
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
105 except pd.errors.EmptyDataError:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
106 sys.exit('Execution aborted: wrong format of ' + name + '\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
107 if len(dataset.columns) < 2:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
108 sys.exit('Execution aborted: wrong format of ' + name + '\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
109 return dataset
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
110
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
111 ############################ dataset name #####################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
112
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
113 def name_dataset(name_data, count):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
114 if str(name_data) == 'Dataset':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
115 return str(name_data) + '_' + str(count)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
116 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
117 return str(name_data)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
118
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
119 ############################ load id e rules ##################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
120
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
121 def load_id_rules(reactions):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
122 ids, rules = [], []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
123 for key, value in reactions.items():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
124 ids.append(key)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
125 rules.append(value)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
126 return (ids, rules)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
127
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
128 ############################ check_methods ####################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
129
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
130 def gene_type(l, name):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
131 if check_hgnc(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
132 return 'hugo_id'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
133 elif check_ensembl(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
134 return 'ensembl_gene_id'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
135 elif check_symbol(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
136 return 'symbol'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
137 elif check_entrez(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
138 return 'entrez_id'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
139 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
140 sys.exit('Execution aborted:\n' +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
141 'gene ID type in ' + name + ' not supported. Supported ID'+
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
142 'types are: HUGO ID, Ensemble ID, HUGO symbol, Entrez ID\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
143
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
144 def check_hgnc(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
145 if len(l) > 5:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
146 if (l.upper()).startswith('HGNC:'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
147 return l[5:].isdigit()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
148 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
149 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
150 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
151 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
152
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
153 def check_ensembl(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
154 if len(l) == 15:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
155 if (l.upper()).startswith('ENS'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
156 return l[4:].isdigit()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
157 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
158 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
159 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
160 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
161
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
162 def check_symbol(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
163 if len(l) > 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
164 if l[0].isalpha() and l[1:].isalnum():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
165 return True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
166 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
167 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
168 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
169 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
170
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
171 def check_entrez(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
172 if len(l) > 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
173 return l.isdigit()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
174 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
175 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
176
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
177 def check_bool(b):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
178 if b == 'true':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
179 return True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
180 elif b == 'false':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
181 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
182
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
183 ############################ resolve_methods ##################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
184
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
185 def replace_gene_value(l, d):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
186 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
187 err = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
188 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
189 if isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
190 tmp_rules, tmp_err = replace_gene_value(l[0], d)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
191 tmp.append(tmp_rules)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
192 err.extend(tmp_err)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
193 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
194 value = replace_gene(l[0], d)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
195 tmp.append(value)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
196 if value == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
197 err.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
198 l = l[1:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
199 return (tmp, err)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
200
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
201
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
202 def replace_gene(l, d):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
203 if l =='and' or l == 'or':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
204 return l
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
205 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
206 value = d.get(l, None)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
207 if not(value == None or isinstance(value, (int, float))):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
208 sys.exit('Execution aborted: ' + value + ' value not valid\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
209 return value
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
210
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
211 def computes(val1, op, val2, cn):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
212 if val1 != None and val2 != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
213 if op == 'and':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
214 return min(val1, val2)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
215 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
216 return val1 + val2
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
217 elif op == 'and':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
218 if cn is True:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
219 if val1 != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
220 return val1
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
221 elif val2 != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
222 return val2
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
223 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
224 return None
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
225 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
226 return None
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
227 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
228 if val1 != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
229 return val1
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
230 elif val2 != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
231 return val2
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
232 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
233 return None
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
234
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
235 def control(ris, l, cn):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
236 if len(l) == 1:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
237 if isinstance(l[0], (float, int)) or l[0] == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
238 return l[0]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
239 elif isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
240 return control(None, l[0], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
241 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
242 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
243 elif len(l) > 2:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
244 return control_list(ris, l, cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
245 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
246 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
247
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
248 def control_list(ris, l, cn):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
249 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
250 if len(l) == 1:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
251 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
252 elif (isinstance(l[0], (float, int)) or
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
253 l[0] == None) and l[1] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
254 if isinstance(l[2], (float, int)) or l[2] == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
255 ris = computes(l[0], l[1], l[2], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
256 elif isinstance(l[2], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
257 tmp = control(None, l[2], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
258 if tmp is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
259 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
260 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
261 ris = computes(l[0], l[1], tmp, cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
262 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
263 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
264 l = l[3:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
265 elif l[0] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
266 if isinstance(l[1], (float, int)) or l[1] == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
267 ris = computes(ris, l[0], l[1], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
268 elif isinstance(l[1], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
269 tmp = control(None,l[1], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
270 if tmp is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
271 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
272 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
273 ris = computes(ris, l[0], tmp, cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
274 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
275 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
276 l = l[2:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
277 elif isinstance(l[0], list) and l[1] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
278 if isinstance(l[2], (float, int)) or l[2] == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
279 tmp = control(None, l[0], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
280 if tmp is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
281 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
282 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
283 ris = computes(tmp, l[1], l[2], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
284 elif isinstance(l[2], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
285 tmp = control(None, l[0], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
286 tmp2 = control(None, l[2], cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
287 if tmp is False or tmp2 is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
288 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
289 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
290 ris = computes(tmp, l[1], tmp2, cn)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
291 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
292 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
293 l = l[3:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
294 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
295 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
296 return ris
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
297
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
298 ############################ map_methods ######################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
299
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
300 def fold_change(avg1, avg2):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
301 if avg1 == 0 and avg2 == 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
302 return 0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
303 elif avg1 == 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
304 return '-INF'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
305 elif avg2 == 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
306 return 'INF'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
307 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
308 return math.log(avg1 / avg2, 2)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
309
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
310 def fix_style(l, col, width, dash):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
311 tmp = l.split(';')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
312 flag_col = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
313 flag_width = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
314 flag_dash = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
315 for i in range(len(tmp)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
316 if tmp[i].startswith('stroke:'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
317 tmp[i] = 'stroke:' + col
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
318 flag_col = True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
319 if tmp[i].startswith('stroke-width:'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
320 tmp[i] = 'stroke-width:' + width
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
321 flag_width = True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
322 if tmp[i].startswith('stroke-dasharray:'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
323 tmp[i] = 'stroke-dasharray:' + dash
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
324 flag_dash = True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
325 if not flag_col:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
326 tmp.append('stroke:' + col)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
327 if not flag_width:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
328 tmp.append('stroke-width:' + width)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
329 if not flag_dash:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
330 tmp.append('stroke-dasharray:' + dash)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
331 return ';'.join(tmp)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
332
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
333 def fix_map(d, core_map, threshold_P_V, threshold_F_C, max_F_C):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
334 maxT = 12
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
335 minT = 2
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
336 grey = '#BEBEBE'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
337 blue = '#0000FF'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
338 red = '#E41A1C'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
339 for el in core_map.iter():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
340 el_id = str(el.get('id'))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
341 if el_id.startswith('R_'):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
342 tmp = d.get(el_id[2:])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
343 if tmp != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
344 p_val = tmp[0]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
345 f_c = tmp[1]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
346 if p_val < threshold_P_V:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
347 if not isinstance(f_c, str):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
348 if abs(f_c) < math.log(threshold_F_C, 2):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
349 col = grey
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
350 width = str(minT)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
351 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
352 if f_c < 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
353 col = blue
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
354 elif f_c > 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
355 col = red
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
356 width = str(max((abs(f_c) * maxT) / max_F_C, minT))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
357 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
358 if f_c == '-INF':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
359 col = blue
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
360 elif f_c == 'INF':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
361 col = red
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
362 width = str(maxT)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
363 dash = 'none'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
364 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
365 dash = '5,5'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
366 col = grey
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
367 width = str(minT)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
368 el.set('style', fix_style(el.get('style'), col, width, dash))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
369 return core_map
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
370
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
371 ############################ make recon #######################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
372
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
373 def check_and_doWord(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
374 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
375 tmp_genes = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
376 count = 0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
377 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
378 if count >= 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
379 if l[0] == '(':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
380 count += 1
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
381 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
382 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
383 elif l[0] == ')':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
384 count -= 1
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
385 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
386 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
387 elif l[0] == ' ':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
388 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
389 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
390 word = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
391 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
392 if l[0] in [' ', '(', ')']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
393 break
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
394 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
395 word.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
396 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
397 word = ''.join(word)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
398 tmp.append(word)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
399 if not(word in ['or', 'and']):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
400 tmp_genes.append(word)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
401 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
402 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
403 if count == 0:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
404 return (tmp, tmp_genes)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
405 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
406 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
407
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
408 def brackets_to_list(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
409 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
410 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
411 if l[0] == '(':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
412 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
413 tmp.append(resolve_brackets(l))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
414 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
415 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
416 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
417 return tmp
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
418
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
419 def resolve_brackets(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
420 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
421 while l[0] != ')':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
422 if l[0] == '(':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
423 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
424 tmp.append(resolve_brackets(l))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
425 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
426 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
427 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
428 l.pop(0)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
429 return tmp
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
430
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
431 def priorityAND(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
432 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
433 flag = True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
434 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
435 if len(l) == 1:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
436 if isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
437 tmp.append(priorityAND(l[0]))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
438 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
439 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
440 l = l[1:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
441 elif l[0] == 'or':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
442 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
443 flag = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
444 l = l[1:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
445 elif l[1] == 'or':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
446 if isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
447 tmp.append(priorityAND(l[0]))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
448 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
449 tmp.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
450 tmp.append(l[1])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
451 flag = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
452 l = l[2:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
453 elif l[1] == 'and':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
454 tmpAnd = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
455 if isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
456 tmpAnd.append(priorityAND(l[0]))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
457 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
458 tmpAnd.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
459 tmpAnd.append(l[1])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
460 if isinstance(l[2], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
461 tmpAnd.append(priorityAND(l[2]))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
462 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
463 tmpAnd.append(l[2])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
464 l = l[3:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
465 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
466 if l[0] == 'and':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
467 tmpAnd.append(l[0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
468 if isinstance(l[1], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
469 tmpAnd.append(priorityAND(l[1]))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
470 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
471 tmpAnd.append(l[1])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
472 l = l[2:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
473 elif l[0] == 'or':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
474 flag = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
475 break
13
e96f3b85e5a0 Uploaded
bimib
parents: 12
diff changeset
476 if flag == True: #when there are only AND in list
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
477 tmp.extend(tmpAnd)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
478 elif flag == False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
479 tmp.append(tmpAnd)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
480 return tmp
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
481
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
482 def checkRule(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
483 if len(l) == 1:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
484 if isinstance(l[0], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
485 if checkRule(l[0]) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
486 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
487 elif len(l) > 2:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
488 if checkRule2(l) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
489 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
490 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
491 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
492 return True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
493
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
494 def checkRule2(l):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
495 while l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
496 if len(l) == 1:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
497 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
498 elif isinstance(l[0], list) and l[1] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
499 if checkRule(l[0]) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
500 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
501 if isinstance(l[2], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
502 if checkRule(l[2]) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
503 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
504 l = l[3:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
505 elif l[1] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
506 if isinstance(l[2], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
507 if checkRule(l[2]) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
508 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
509 l = l[3:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
510 elif l[0] in ['and', 'or']:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
511 if isinstance(l[1], list):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
512 if checkRule(l[1]) is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
513 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
514 l = l[2:]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
515 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
516 return False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
517 return True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
518
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
519 def do_rules(rules):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
520 split_rules = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
521 err_rules = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
522 tmp_gene_in_rule = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
523 for i in range(len(rules)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
524 tmp = list(rules[i])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
525 if tmp:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
526 tmp, tmp_genes = check_and_doWord(tmp)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
527 tmp_gene_in_rule.extend(tmp_genes)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
528 if tmp is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
529 split_rules.append([])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
530 err_rules.append(rules[i])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
531 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
532 tmp = brackets_to_list(tmp)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
533 if checkRule(tmp):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
534 split_rules.append(priorityAND(tmp))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
535 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
536 split_rules.append([])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
537 err_rules.append(rules[i])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
538 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
539 split_rules.append([])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
540 if err_rules:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
541 warning('Warning: wrong format rule in ' + str(err_rules) + '\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
542 return (split_rules, list(set(tmp_gene_in_rule)))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
543
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
544 def make_recon(data):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
545 try:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
546 import cobra as cb
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
547 import warnings
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
548 with warnings.catch_warnings():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
549 warnings.simplefilter('ignore')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
550 recon = cb.io.read_sbml_model(data)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
551 react = recon.reactions
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
552 rules = [react[i].gene_reaction_rule for i in range(len(react))]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
553 ids = [react[i].id for i in range(len(react))]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
554 except cb.io.sbml3.CobraSBMLError:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
555 try:
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
556 data = (pd.read_csv(data, sep = '\t', dtype = str, engine='python')).fillna('')
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
557 if len(data.columns) < 2:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
558 sys.exit('Execution aborted: wrong format of '+
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
559 'custom datarules\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
560 if not len(data.columns) == 2:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
561 warning('Warning: more than 2 columns in custom datarules.\n' +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
562 'Extra columns have been disregarded\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
563 ids = list(data.iloc[:, 0])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
564 rules = list(data.iloc[:, 1])
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
565 except pd.errors.EmptyDataError:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
566 sys.exit('Execution aborted: wrong format of custom datarules\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
567 except pd.errors.ParserError:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
568 sys.exit('Execution aborted: wrong format of custom datarules\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
569 split_rules, tmp_genes = do_rules(rules)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
570 gene_in_rule = {}
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
571 for i in tmp_genes:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
572 gene_in_rule[i] = 'ok'
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
573 return (ids, split_rules, gene_in_rule)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
574
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
575 ############################ gene #############################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
576
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
577 def data_gene(gene, type_gene, name, gene_custom):
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
578 args = process_args(sys.argv)
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
579 for i in range(len(gene)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
580 tmp = gene.iloc[i, 0]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
581 if tmp.startswith(' ') or tmp.endswith(' '):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
582 gene.iloc[i, 0] = (tmp.lstrip()).rstrip()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
583 gene_dup = [item for item, count in
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
584 collections.Counter(gene[gene.columns[0]]).items() if count > 1]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
585 pat_dup = [item for item, count in
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
586 collections.Counter(list(gene.columns)).items() if count > 1]
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
587
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
588 if gene_dup:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
589 if gene_custom == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
590 if args.rules_selector == 'HMRcore':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
591 gene_in_rule = pk.load(open(args.tool_dir +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
592 '/local/HMRcore_genes.p', 'rb'))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
593 elif args.rules_selector == 'Recon':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
594 gene_in_rule = pk.load(open(args.tool_dir +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
595 '/local/Recon_genes.p', 'rb'))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
596 gene_in_rule = gene_in_rule.get(type_gene)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
597 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
598 gene_in_rule = gene_custom
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
599 tmp = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
600 for i in gene_dup:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
601 if gene_in_rule.get(i) == 'ok':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
602 tmp.append(i)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
603 if tmp:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
604 sys.exit('Execution aborted because gene ID '
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
605 +str(tmp)+' in '+name+' is duplicated\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
606 if pat_dup:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
607 warning('Warning: duplicated label\n' + str(pat_dup) + 'in ' + name +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
608 '\n')
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
609
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
610 return (gene.set_index(gene.columns[0])).to_dict()
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
611
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
612 ############################ resolve ##########################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
613
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
614 def resolve(genes, rules, ids, resolve_none, name):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
615 resolve_rules = {}
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
616 not_found = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
617 flag = False
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
618 for key, value in genes.items():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
619 tmp_resolve = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
620 for i in range(len(rules)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
621 tmp = rules[i]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
622 if tmp:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
623 tmp, err = replace_gene_value(tmp, value)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
624 if err:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
625 not_found.extend(err)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
626 ris = control(None, tmp, resolve_none)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
627 if ris is False or ris == None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
628 tmp_resolve.append(None)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
629 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
630 tmp_resolve.append(ris)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
631 flag = True
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
632 else:
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
633 tmp_resolve.append(None)
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
634 resolve_rules[key] = tmp_resolve
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
635 if flag is False:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
636 warning('Warning: no computable score (due to missing gene values)' +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
637 'for class ' + name + ', the class has been disregarded\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
638 return (None, None)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
639 return (resolve_rules, list(set(not_found)))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
640
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
641 ############################ split class ######################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
642
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
643 def split_class(classes, resolve_rules):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
644 class_pat = {}
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
645 for i in range(len(classes)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
646 classe = classes.iloc[i, 1]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
647 if not pd.isnull(classe):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
648 l = []
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
649 for j in range(i, len(classes)):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
650 if classes.iloc[j, 1] == classe:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
651 pat_id = classes.iloc[j, 0]
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
652 tmp = resolve_rules.get(pat_id, None)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
653 if tmp != None:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
654 l.append(tmp)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
655 classes.iloc[j, 1] = None
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
656 if l:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
657 class_pat[classe] = list(map(list, zip(*l)))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
658 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
659 warning('Warning: no sample found in class ' + classe +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
660 ', the class has been disregarded\n')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
661 return class_pat
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
662
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
663 ############################ map ##############################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
664
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
665 def maps(core_map, class_pat, ids, threshold_P_V, threshold_F_C, create_svg, create_pdf, comparison, control):
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
666 args = process_args(sys.argv)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
667 if (not class_pat) or (len(class_pat.keys()) < 2):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
668 sys.exit('Execution aborted: classes provided for comparisons are ' +
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
669 'less than two\n')
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
670
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
671 if comparison == "manyvsmany":
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
672 for i, j in it.combinations(class_pat.keys(), 2):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
673
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
674 tmp = {}
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
675 count = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
676 max_F_C = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
677 for l1, l2 in zip(class_pat.get(i), class_pat.get(j)):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
678 try:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
679 stat_D, p_value = st.ks_2samp(l1, l2)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
680 #sum(l1) da errore secondo me perchè ha null
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
681 avg = fold_change(sum(l1) / len(l1), sum(l2) / len(l2))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
682 if not isinstance(avg, str):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
683 if max_F_C < abs(avg):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
684 max_F_C = abs(avg)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
685 tmp[ids[count]] = [float(p_value), avg]
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
686 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
687 except (TypeError, ZeroDivisionError):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
688 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
689 tab = 'result/' + i + '_vs_' + j + ' (Tabular Result).tsv'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
690 tmp_csv = pd.DataFrame.from_dict(tmp, orient = "index")
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
691 tmp_csv = tmp_csv.reset_index()
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
692 header = ['ids', 'P_Value', 'Log2(fold change)']
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
693 tmp_csv.to_csv(tab, sep = '\t', index = False, header = header)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
694
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
695 if create_svg or create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
696 if args.rules_selector == 'HMRcore' or (args.rules_selector == 'Custom'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
697 and args.yes_no == 'yes'):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
698 fix_map(tmp, core_map, threshold_P_V, threshold_F_C, max_F_C)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
699 file_svg = 'result/' + i + '_vs_' + j + ' (SVG Map).svg'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
700 with open(file_svg, 'wb') as new_map:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
701 new_map.write(ET.tostring(core_map))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
702
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
703
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
704 if create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
705 file_pdf = 'result/' + i + '_vs_' + j + ' (PDF Map).pdf'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
706 renderPDF.drawToFile(svg2rlg(file_svg), file_pdf)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
707
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
708 if not create_svg:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
709 #Ho utilizzato il file svg per generare il pdf,
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
710 #ma l'utente non ne ha richiesto il ritorno, quindi
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
711 #lo elimino
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
712
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
713 os.remove('result/' + i + '_vs_' + j + ' (SVG Map).svg')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
714 elif comparison == "onevsrest":
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
715 for single_cluster in class_pat.keys():
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
716 t = []
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
717 for k in class_pat.keys():
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
718 if k != single_cluster:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
719 t.append(class_pat.get(k))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
720 rest = []
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
721 for i in t:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
722 rest = rest + i
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
723
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
724 tmp = {}
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
725 count = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
726 max_F_C = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
727
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
728 for l1, l2 in zip(rest, class_pat.get(single_cluster)):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
729 try:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
730 stat_D, p_value = st.ks_2samp(l1, l2)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
731 avg = fold_change(sum(l1) / len(l1), sum(l2) / len(l2))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
732 if not isinstance(avg, str):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
733 if max_F_C < abs(avg):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
734 max_F_C = abs(avg)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
735 tmp[ids[count]] = [float(p_value), avg]
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
736 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
737 except (TypeError, ZeroDivisionError):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
738 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
739 tab = 'result/' + single_cluster + '_vs_rest (Tabular Result).tsv'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
740 tmp_csv = pd.DataFrame.from_dict(tmp, orient = "index")
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
741 tmp_csv = tmp_csv.reset_index()
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
742 header = ['ids', 'P_Value', 'Log2(fold change)']
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
743 tmp_csv.to_csv(tab, sep = '\t', index = False, header = header)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
744
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
745 if create_svg or create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
746 if args.rules_selector == 'HMRcore' or (args.rules_selector == 'Custom'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
747 and args.yes_no == 'yes'):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
748 fix_map(tmp, core_map, threshold_P_V, threshold_F_C, max_F_C)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
749 file_svg = 'result/' + single_cluster + '_vs_ rest (SVG Map).svg'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
750 with open(file_svg, 'wb') as new_map:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
751 new_map.write(ET.tostring(core_map))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
752
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
753
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
754 if create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
755 file_pdf = 'result/' + single_cluster + '_vs_ rest (PDF Map).pdf'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
756 renderPDF.drawToFile(svg2rlg(file_svg), file_pdf)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
757
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
758 if not create_svg:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
759 os.remove('result/' + single_cluster + '_vs_ rest (SVG Map).svg')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
760
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
761 elif comparison == "onevsmany":
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
762 for i, j in it.combinations(class_pat.keys(), 2):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
763
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
764 if i != control and j != control:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
765 print(str(control) + " " + str(i) + " " + str(j))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
766 #Se è un confronto fra elementi diversi dal controllo, skippo
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
767 continue
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
768
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
769 print('vado')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
770 tmp = {}
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
771 count = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
772 max_F_C = 0
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
773 for l1, l2 in zip(class_pat.get(i), class_pat.get(j)):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
774 try:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
775 stat_D, p_value = st.ks_2samp(l1, l2)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
776 #sum(l1) da errore secondo me perchè ha null
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
777 avg = fold_change(sum(l1) / len(l1), sum(l2) / len(l2))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
778 if not isinstance(avg, str):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
779 if max_F_C < abs(avg):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
780 max_F_C = abs(avg)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
781 tmp[ids[count]] = [float(p_value), avg]
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
782 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
783 except (TypeError, ZeroDivisionError):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
784 count += 1
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
785 tab = 'result/' + i + '_vs_' + j + ' (Tabular Result).tsv'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
786 tmp_csv = pd.DataFrame.from_dict(tmp, orient = "index")
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
787 tmp_csv = tmp_csv.reset_index()
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
788 header = ['ids', 'P_Value', 'Log2(fold change)']
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
789 tmp_csv.to_csv(tab, sep = '\t', index = False, header = header)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
790
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
791 if create_svg or create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
792 if args.rules_selector == 'HMRcore' or (args.rules_selector == 'Custom'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
793 and args.yes_no == 'yes'):
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
794 fix_map(tmp, core_map, threshold_P_V, threshold_F_C, max_F_C)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
795 file_svg = 'result/' + i + '_vs_' + j + ' (SVG Map).svg'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
796 with open(file_svg, 'wb') as new_map:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
797 new_map.write(ET.tostring(core_map))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
798
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
799
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
800 if create_pdf:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
801 file_pdf = 'result/' + i + '_vs_' + j + ' (PDF Map).pdf'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
802 renderPDF.drawToFile(svg2rlg(file_svg), file_pdf)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
803
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
804 if not create_svg:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
805 #Ho utilizzato il file svg per generare il pdf,
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
806 #ma l'utente non ne ha richiesto il ritorno, quindi
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
807 #lo elimino
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
808
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
809 os.remove('result/' + i + '_vs_' + j + ' (SVG Map).svg')
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
810
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
811
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
812
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
813
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
814 return None
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
815
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
816 ############################ MAIN #############################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
817
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
818 def main():
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
819 args = process_args(sys.argv)
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
820
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
821 create_svg = check_bool(args.generate_svg)
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
822 create_pdf = check_bool(args.generate_pdf)
35
7b1971251c63 Uploaded
bimib
parents: 34
diff changeset
823
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
824 if os.path.isdir('result') == False:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
825 os.makedirs('result')
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
826
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
827 if args.rules_selector == 'HMRcore':
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
828 recon = pk.load(open(args.tool_dir + '/local/HMRcore_rules.p', 'rb'))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
829 elif args.rules_selector == 'Recon':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
830 recon = pk.load(open(args.tool_dir + '/local/Recon_rules.p', 'rb'))
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
831 elif args.rules_selector == 'Custom':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
832 ids, rules, gene_in_rule = make_recon(args.custom)
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
833
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
834 class_pat = {}
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
835
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
836 if args.option == 'datasets':
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
837 num = 1
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
838 for i, j in zip(args.input_datas, args.names):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
839 name = name_dataset(j, num)
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
840 resolve_rules = read_dataset(i, name)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
841
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
842 resolve_rules.iloc[:, 0] = (resolve_rules.iloc[:, 0]).astype(str)
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
843
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
844 ids = pd.Series.tolist(resolve_rules.iloc[:, 0])
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
845
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
846 resolve_rules = resolve_rules.drop(resolve_rules.columns[[0]], axis=1)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
847 resolve_rules = resolve_rules.replace({'None': None})
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
848 resolve_rules = resolve_rules.to_dict('list')
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
849
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
850 #Converto i valori da str a float
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
851 to_float = lambda x: float(x) if (x != None) else None
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
852
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
853 resolve_rules_float = {}
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
854
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
855 for k in resolve_rules:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
856 resolve_rules_float[k] = list(map(to_float, resolve_rules[k])); resolve_rules_float
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
857
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
858 if resolve_rules != None:
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
859 class_pat[name] = list(map(list, zip(*resolve_rules_float.values())))
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
860
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
861 num += 1
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
862
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
863 if args.option == 'dataset_class':
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
864 name = 'RAS'
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
865 resolve_rules = read_dataset(args.input_data, name)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
866 resolve_rules.iloc[:, 0] = (resolve_rules.iloc[:, 0]).astype(str)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
867
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
868 ids = pd.Series.tolist(resolve_rules.iloc[:, 0])
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
869
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
870 resolve_rules = resolve_rules.drop(resolve_rules.columns[[0]], axis=1)
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
871 resolve_rules = resolve_rules.replace({'None': None})
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
872 resolve_rules = resolve_rules.to_dict('list')
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
873
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
874 #Converto i valori da str a float
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
875 to_float = lambda x: float(x) if (x != None) else None
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
876
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
877 resolve_rules_float = {}
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
878
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
879 for k in resolve_rules:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
880 resolve_rules_float[k] = list(map(to_float, resolve_rules[k])); resolve_rules_float
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
881
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
882 classes = read_dataset(args.input_class, 'class')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
883 classes = classes.astype(str)
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
884
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
885 if resolve_rules_float != None:
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
886 class_pat = split_class(classes, resolve_rules_float)
28
e6831924df01 small fixes (elbow plot and output managment)
bimib
parents: 16
diff changeset
887
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
888 if args.rules_selector == 'Custom':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
889 if args.yes_no == 'yes':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
890 try:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
891 core_map = ET.parse(args.custom_map)
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
892 except (ET.XMLSyntaxError, ET.XMLSchemaParseError):
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
893 sys.exit('Execution aborted: custom map in wrong format')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
894 elif args.yes_no == 'no':
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
895 core_map = ET.parse(args.tool_dir + '/local/HMRcoreMap.svg')
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
896 else:
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
897 core_map = ET.parse(args.tool_dir+'/local/HMRcoreMap.svg')
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
898
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
899 maps(core_map, class_pat, ids, args.pValue, args.fChange, create_svg, create_pdf, args.comparison, args.control)
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
900
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
901 print('Execution succeded')
47
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
902
3af9d394367c Uploaded
bimib
parents: 35
diff changeset
903 return None
16
c71ac0bb12de Uploaded
bimib
parents: 13
diff changeset
904
0
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
905
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
906 ###############################################################################
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
907
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
908 if __name__ == "__main__":
23ac9cf12788 Uploaded
bimib
parents:
diff changeset
909 main()