annotate commons/pyRepetUnit/convCoord/ConvSetChr2Chunk.py @ 31:0ab839023fe4

Uploaded
author m-zytnicki
date Tue, 30 Apr 2013 14:33:21 -0400
parents 94ab73e8a190
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
18
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
1 from copy import deepcopy
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
2 from commons.core.sql.TableSetAdaptator import TableSetAdaptator
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
3 from commons.core.coord.Map import Map
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
4 from commons.core.coord.Set import Set
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
5 import os
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
6
94ab73e8a190 Uploaded
m-zytnicki
parents:
diff changeset
class ConvSetChr2Chunk(object):
    """
    Convert the coordinates of a 'set' table from chromosomes to chunks.

    For every set read from the input table, the chunk table is queried
    for the chunks overlapping that set, and one copy of the set is
    written per overlapping chunk, renamed after the chunk and with its
    coordinates expressed relative to the chunk (1-based).
    """

    def __init__(self, db, table, chunk_table, outtable):
        """
        Store the parameters of the conversion; no database access here.

        db          -- database handle; convert() calls execute(),
                       fetchall() and createTable() on it
        table       -- name of the input 'set' table
        chunk_table -- name of the table describing the chunks
        outtable    -- name of the 'set' table created by convert()
        """
        self._tablename = table
        self._chunk_table = chunk_table
        self._db = db
        self._outtable = outtable

    @staticmethod
    def _toChunkCoord(pos, chunk_start, chunk_end):
        """
        Return 'pos' as a 1-based coordinate relative to the chunk.

        The position is first clipped to [chunk_start, chunk_end], so a set
        sticking out of the chunk is truncated at the chunk edge, and a
        position lying exactly on an edge is converted like any other.
        Assumes chunk_start <= chunk_end.
        """
        clipped = min(max(pos, chunk_start), chunk_end)
        return clipped - chunk_start + 1

    def convert(self):
        """
        Convert a 'set' table format.

        The converted sets are first written to a temporary file named
        after the process id in the current directory, which is then
        loaded into the output table. The temporary file is removed
        afterwards, whether or not the conversion succeeded.
        """
        temp_file = str(os.getpid()) + ".on_chunk"

        # Select the chunks of a chromosome that overlap [min, max]: one of
        # the two bounds falls inside the chunk, or the range covers it.
        # NOTE(review): the query is built by string interpolation; the
        # table and sequence names are assumed to come from trusted data.
        str_mask = ("SELECT * FROM " + self._chunk_table
                    + " WHERE chr='%s' AND ("
                    + "(%d BETWEEN LEAST(start,end) AND GREATEST(start,end))"
                    + " OR (%d BETWEEN LEAST(start,end) AND GREATEST(start,end))"
                    + " OR (%d <= LEAST(start,end) AND %d >= GREATEST(start,end)));")

        iTSA = TableSetAdaptator(self._db, self._tablename)

        try:
            # The file must be closed (hence flushed) before it is loaded.
            with open(temp_file, 'w') as fout:
                for path_num in iTSA.getIdList():
                    for r in iTSA.getSetListFromId(path_num):
                        sql_cmd = str_mask % (r.seqname,
                                              r.getMin(), r.getMax(),
                                              r.getMin(), r.getMax())
                        self._db.execute(sql_cmd)
                        for row in self._db.fetchall():
                            # presumably (name, chr, start, end) -- confirm
                            # against the chunk table schema
                            chunk = Map(row[0], row[1], int(row[2]), int(row[3]))

                            new_r = deepcopy(r)
                            new_r.seqname = chunk.name
                            # Clipping each end independently keeps the
                            # start/end order, hence the strand of the set.
                            new_r.start = self._toChunkCoord(r.start, chunk.start, chunk.end)
                            new_r.end = self._toChunkCoord(r.end, chunk.start, chunk.end)
                            new_r.write(fout)

            self._db.createTable(self._outtable, "set", temp_file)
        finally:
            # Do not leave the temporary file behind, even on failure.
            if os.path.exists(temp_file):
                os.remove(temp_file)