Mercurial > repos > yufei-luo > s_mart
diff commons/pyRepetUnit/convCoord/ConvPathChr2Chunk.py @ 18:94ab73e8a190
Uploaded
author | m-zytnicki |
---|---|
date | Mon, 29 Apr 2013 03:20:15 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/commons/pyRepetUnit/convCoord/ConvPathChr2Chunk.py Mon Apr 29 03:20:15 2013 -0400 @@ -0,0 +1,68 @@ +from copy import deepcopy +from commons.core.sql.TablePathAdaptator import TablePathAdaptator +from commons.core.coord.PathUtils import PathUtils +from commons.core.coord.Map import Map +from commons.core.coord.Path import Path +import os + +class ConvPathChr2Chunk(object): + + def __init__(self, db, table, chunk_table, outtable): + self._tablename = table + self._chunk_table = chunk_table + self._db = db + self._outtable = outtable + + def convert(self): + """ + Convert a 'path' table format. + """ + temp_file = str(os.getpid()) + ".on_chunk" + fout = open(temp_file,'w') + + str_mask = "SELECT * FROM "+\ + self._chunk_table + " WHERE chr='%s' AND ("+\ + "(%d BETWEEN LEAST(start,end) AND GREATEST(start,end))"+\ + " OR (%d BETWEEN LEAST(start,end) AND GREATEST(start,end))"+\ + " OR (%d <= LEAST(start,end) AND %d >= GREATEST(start,end)));" + + iTPA = TablePathAdaptator(self._db, self._tablename) + path_num_list = iTPA.getIdList() + + for path_num in path_num_list: + slist = iTPA.getPathListFromId(path_num) + for r in slist: + r_min, r_max = PathUtils.getQueryMinMaxFromPathList([r]) + sql_cmd = str_mask%(r.range_query.seqname,r_min,r_max,r_min,r_max) + self._db.execute(sql_cmd) + res = self._db.fetchall() + for i in res: + chunk = Map(i[0],i[1],int(i[2]),int(i[3])) + + new_r = Path() + new_r = deepcopy(r) + new_r.range_query.seqname = chunk.name + + if (r.range_query.start > chunk.start and r.range_query.start < chunk.end): + new_r.range_query.start = r.range_query.start - chunk.start + 1 + if (r.range_query.end > chunk.start and r.range_query.end < chunk.end): + new_r.range_query.end = r.range_query.end - chunk.start + 1 + + if r.range_query.isOnDirectStrand(): + if r.range_query.start <= chunk.start: + new_r.range_query.start = 1 + if r.range_query.end >= chunk.end: + new_r.range_query.end = chunk.end - chunk.start + 1 + else: + if r.range_query.end <= chunk.start: + new_r.range_query.end = 1 + if r.range_query.start >= chunk.end: + new_r.range_query.start = chunk.end - chunk.start + 1 + + new_r.write(fout) + + fout.close() + + self._db.createTable(self._outtable, "path", temp_file) + + os.remove(temp_file) \ No newline at end of file