Mercurial > repos > yufei-luo > s_mart
comparison SMART/Java/Python/mySql/MySqlTable.py @ 6:769e306b7933
Change the repository level.
author | yufei-luo |
---|---|
date | Fri, 18 Jan 2013 04:54:14 -0500 |
parents | |
children | 94ab73e8a190 |
comparison
equal
deleted
inserted
replaced
5:ea3082881bf8 | 6:769e306b7933 |
---|---|
1 # | |
2 # Copyright INRA-URGI 2009-2010 | |
3 # | |
4 # This software is governed by the CeCILL license under French law and | |
5 # abiding by the rules of distribution of free software. You can use, | |
6 # modify and/ or redistribute the software under the terms of the CeCILL | |
7 # license as circulated by CEA, CNRS and INRIA at the following URL | |
8 # "http://www.cecill.info". | |
9 # | |
10 # As a counterpart to the access to the source code and rights to copy, | |
11 # modify and redistribute granted by the license, users are provided only | |
12 # with a limited warranty and the software's author, the holder of the | |
13 # economic rights, and the successive licensors have only limited | |
14 # liability. | |
15 # | |
16 # In this respect, the user's attention is drawn to the risks associated | |
17 # with loading, using, modifying and/or developing or reproducing the | |
18 # software by the user in light of its specific status of free software, | |
19 # that may mean that it is complicated to manipulate, and that also | |
20 # therefore means that it is reserved for developers and experienced | |
21 # professionals having in-depth computer knowledge. Users are therefore | |
22 # encouraged to load and test the software's suitability as regards their | |
23 # requirements in conditions enabling the security of their systems and/or | |
24 # data to be ensured and, more generally, to use and operate it in the | |
25 # same conditions as regards security. | |
26 # | |
27 # The fact that you are presently reading this means that you have had | |
28 # knowledge of the CeCILL license and that you accept its terms. | |
29 # | |
30 import re | |
31 import sys | |
32 | |
33 class MySqlTable(object): | |
34 """ | |
35 Store a table of a mySQL database, used for transcripts or exons | |
36 Record a a name and a type (int, float, double) for each column | |
37 @ivar name: name of the table | |
38 @type name: string | |
39 @ivar variables: name of the columns | |
40 @type variables: list of string | |
41 @ivar types: type of the columns | |
42 @type types: dict of string | |
43 @ivar mySqlConnection: connection to a database | |
44 @type mySqlConnection: class L{MySqlConnection<MySqlConnection>} | |
45 @ivar nbLines: number of rows | |
46 @type nbLines: int | |
47 @ivar verbosity: verbosity | |
48 @type verbosity: int | |
49 """ | |
50 | |
51 def __init__(self, connection, name, verbosity = 0): | |
52 """ | |
53 Constructor | |
54 Possibly retrieve column names and types if table exists | |
55 @param mySqlConnection: connection to a databas | |
56 @type mySqlConnection: class L{MySqlConnection<MySqlConnection>} | |
57 @param name: name of the table | |
58 @type name: string | |
59 @param verbosity: verbosity | |
60 @type verbosity: int | |
61 """ | |
62 self.name = name | |
63 self.variables = [] | |
64 self.types = {} | |
65 self.sizes = {} | |
66 self.nbLines = None | |
67 self.verbosity = verbosity | |
68 self.mySqlConnection = connection | |
69 queryTables = self.mySqlConnection.executeQuery("SELECT name FROM sqlite_master WHERE type LIKE 'table' AND name LIKE '%s'" % (self.name)) | |
70 self.created = not queryTables.isEmpty() | |
71 if self.created: | |
72 queryFields = self.mySqlConnection.executeQuery("PRAGMA table_info('%s')" % (name)) | |
73 for field in queryFields.getIterator(): | |
74 if field[1] != "id": | |
75 self.variables.append(field[1]) | |
76 self.types[field[1]] = field[2] | |
77 self.sizes[field[1]] = field[3] | |
78 | |
79 | |
80 def getName(self): | |
81 return self.name | |
82 | |
83 | |
84 def create(self, variables, types, sizes): | |
85 """ | |
86 Create a table using give column names and types | |
87 @param variables: names of the columns | |
88 @type variables: list of string | |
89 @param types: types of the columns | |
90 @type types: dict of string | |
91 @param sizes: sizes of the types | |
92 @type sizes: dict of int | |
93 """ | |
94 self.variables = variables | |
95 self.types = types | |
96 self.sizes = sizes | |
97 if self.created: | |
98 self.remove() | |
99 query = "CREATE TABLE '%s' (id INTEGER PRIMARY KEY" % (self.name) | |
100 for variable in variables: | |
101 query = "%s, %s %s(%d)" % (query, variable, types[variable], sizes[variable]) | |
102 query += ")" | |
103 self.mySqlConnection.executeQuery(query) | |
104 self.created = True | |
105 | |
106 | |
107 def insertMany(self, lines): | |
108 """ | |
109 Insert many lines | |
110 @param lines: the list of values | |
111 @type lines: list of lists | |
112 """ | |
113 commands = [] | |
114 for values in lines: | |
115 commands.append("INSERT INTO '%s' (%s) VALUES (%s)" % (self.name, ", ".join(self.variables), ", ".join([MySqlTable.formatSql(values[variable], self.types[variable], self.sizes[variable]) for variable in self.variables]))) | |
116 self.mySqlConnection.executeManyQueries(commands) | |
117 | |
118 | |
119 def rename(self, name): | |
120 """ | |
121 Rename the table | |
122 @param name: the new name | |
123 @type name: string | |
124 """ | |
125 self.mySqlConnection.executeQuery("RENAME TABLE '%s' TO '%s'" % (self.name, name)) | |
126 self.name = name | |
127 | |
128 | |
129 def copy(self, table): | |
130 """ | |
131 Copy the given table this one | |
132 @param table: the table to be copied | |
133 @type table: class L{MySqlTable<MySqlTable>} | |
134 """ | |
135 variables = [] | |
136 types = {} | |
137 sizes = {} | |
138 fields = self.mySqlConnection.executeQuery("PRAGMA table_info(%s)" % (table.name)) | |
139 for field in fields.getIterator(): | |
140 if field[1] != "id": | |
141 variables.append(field[1]) | |
142 m = re.search(r"(\w+)\((\d+)\)", field[2]) | |
143 if m == None: | |
144 raise Exception("\nFormat %s in table %s is strange." % (field[2], table.name)) | |
145 types[field[1]] = m.group(1) | |
146 sizes[field[1]] = int(m.group(2)) | |
147 self.create(variables, types, sizes) | |
148 self.mySqlConnection.executeQuery("INSERT INTO '%s' SELECT * FROM %s" % (self.name, table.name)) | |
149 | |
150 | |
151 def add(self, table): | |
152 """ | |
153 Add the content of a table to this one | |
154 @param table: the table to be added | |
155 @type table: class L{MySqlTable<MySqlTable>} | |
156 """ | |
157 self.mySqlConnection.executeQuery("INSERT INTO '%s' SELECT * FROM %s" % (self.name, table.name)) | |
158 self.created = True | |
159 | |
160 | |
161 def exists(self): | |
162 """ | |
163 Check if the table exists in mySQL | |
164 @return: true if it exits | |
165 """ | |
166 return self.created | |
167 | |
168 | |
169 def remove(self): | |
170 """ | |
171 Remove this table | |
172 """ | |
173 if self.exists(): | |
174 query = "DROP TABLE IF EXISTS '%s'" % (self.name) | |
175 self.mySqlConnection.executeQuery(query) | |
176 self.created = False | |
177 | |
178 | |
179 def clear(self): | |
180 """ | |
181 Clear the content of this table | |
182 """ | |
183 self.mySqlConnection.executeQuery("DELETE FROM '%s'" % (self.name)) | |
184 | |
185 | |
186 def getNbElements(self): | |
187 """ | |
188 Count the number of rows in the table | |
189 """ | |
190 command = "SELECT COUNT(id) FROM '%s'" % (self.name) | |
191 query = self.mySqlConnection.executeQuery(command) | |
192 return int(query.getLine()[0]) | |
193 | |
194 | |
195 def formatSql(self, value, type, size): | |
196 """ | |
197 Format a value using MySQL encapsulation | |
198 """ | |
199 if type.find("int") != -1: | |
200 return "%d" % value | |
201 if type.find("float") != -1: | |
202 return "%.10f" % value | |
203 if type.find("double") != -1: | |
204 return "%.20f" % value | |
205 if type.find("varchar") != -1: | |
206 if len(value) > size: | |
207 return "'%s'" % value[0:size] | |
208 return "'%s'" % value | |
209 raise Exception("Do not understand type %s" % (type)) | |
210 formatSql = classmethod(formatSql) | |
211 | |
212 | |
213 def addLine(self, values): | |
214 """ | |
215 Add a row to this table | |
216 @param values: the values of the row | |
217 @type values: dict | |
218 @return: the id of the added row | |
219 """ | |
220 sqlValues = [] | |
221 for variable in self.variables: | |
222 sqlValues.append(self.formatSql(values[variable], self.types[variable], self.sizes[variable])) | |
223 command = "INSERT INTO '%s' (%s) VALUES (%s)" % (self.name, ", ".join(self.variables), ", ".join(sqlValues)) | |
224 id = self.mySqlConnection.executeQuery(command, True) | |
225 return id | |
226 | |
227 | |
228 def retrieveFromId(self, id): | |
229 """ | |
230 Retrieve a row from its id | |
231 @param id: the id of the row | |
232 @type id: int | |
233 @return: the row | |
234 """ | |
235 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' WHERE id = %d" % (self.name, id)) | |
236 result = query.getLine() | |
237 if result == None: | |
238 raise Exception("Error! Id %d is not in the table %s!" % (id, self.name)) | |
239 return result | |
240 | |
241 | |
242 def retrieveBulkFromId(self, ids): | |
243 """ | |
244 Retrieve a row from its id | |
245 @param id: the ids of the row | |
246 @type id: list of int | |
247 @return: the row | |
248 """ | |
249 if not ids: | |
250 return [] | |
251 MAXSIZE = 1000 | |
252 results = [] | |
253 for batch in range(len(ids) / MAXSIZE + 1): | |
254 theseIds = ids[batch * MAXSIZE : (batch+1) * MAXSIZE] | |
255 if theseIds: | |
256 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' WHERE id IN (%s)" % (self.name, ", ".join(["%d" % (id) for id in theseIds]))) | |
257 lines = query.getLines() | |
258 if len(lines) != len(theseIds): | |
259 raise Exception("Error! Some Ids of (%s) is are missing in the table '%s' (got %d instead of %d)!" % (", ".join(["%d" % (id) for id in theseIds]), self.name, len(lines)), len(theseIds)) | |
260 results.extend(lines) | |
261 return results | |
262 | |
263 | |
264 def removeFromId(self, id): | |
265 """ | |
266 Remove a row from its id | |
267 @param id: the id of the row | |
268 @type id: int | |
269 """ | |
270 self.mySqlConnection.executeQuery("DELETE FROM '%s' WHERE id = %d" % (self.name, id)) | |
271 | |
272 | |
273 def getIterator(self): | |
274 """ | |
275 Iterate on the content of table | |
276 @return: iterator to the rows of the table | |
277 """ | |
278 if not self.created: | |
279 return | |
280 MAXSIZE = 1000 | |
281 query = self.mySqlConnection.executeQuery("SELECT count(id) FROM '%s'" % (self.name)) | |
282 nbRows = int(query.getLine()[0]) | |
283 for chunk in range((nbRows / MAXSIZE) + 1): | |
284 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' LIMIT %d, %d" % (self.name, chunk * MAXSIZE, MAXSIZE)) | |
285 for line in query.getIterator(): | |
286 yield line | |
287 | |
288 | |
289 def createIndex(self, indexName, values, unique = False, fullText = False): | |
290 """ | |
291 Add an index on the table | |
292 @param indexName: name of the index | |
293 @type indexName: string | |
294 @param values: values to be indexed | |
295 @type values: string | |
296 @param unique: if the index is unique | |
297 @type unique: boolean | |
298 @param fullText: whether full text should be indexed | |
299 @type fullText: boolean | |
300 """ | |
301 self.mySqlConnection.executeQuery("CREATE %s%sINDEX '%s' ON '%s' (%s)" % ("UNIQUE " if unique else "", "FULLTEXT " if fullText else "", indexName, self.name, ", ".join(values))) | |
302 | |
303 | |
304 def setDefaultTagValue(self, field, name, value): | |
305 """ | |
306 Add a tag value | |
307 @param name: name of the tag | |
308 @type name: string | |
309 @param value: value of the tag | |
310 @type value: string or int | |
311 """ | |
312 newData = {} | |
313 for line in MySqlTable.getIterator(self): | |
314 id = line[0] | |
315 tags = line[field] | |
316 if tags == '': | |
317 newTag = "%s=%s" % (name, value) | |
318 else: | |
319 newTag = "%s;%s=%s" % (tags, name, value) | |
320 if name not in [tag.split("=")[0] for tag in tags.split(";")]: | |
321 newData[id] = newTag | |
322 for id, tag in newData.iteritems(): | |
323 query = self.mySqlConnection.executeQuery("UPDATE '%s' SET tags = '%s' WHERE id = %i" % (self.name, tag, id)) | |
324 | |
325 | |
326 | |
327 def show(self): | |
328 """ | |
329 Drop the content of the current table | |
330 """ | |
331 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s'" % (self.name)) | |
332 print query.getLines() | |
333 | |
334 |