comparison SMART/Java/Python/mySql/MySqlTable.py @ 6:769e306b7933

Change the repository level.
author yufei-luo
date Fri, 18 Jan 2013 04:54:14 -0500
parents
children 94ab73e8a190
comparison
equal deleted inserted replaced
5:ea3082881bf8 6:769e306b7933
1 #
2 # Copyright INRA-URGI 2009-2010
3 #
4 # This software is governed by the CeCILL license under French law and
5 # abiding by the rules of distribution of free software. You can use,
6 # modify and/ or redistribute the software under the terms of the CeCILL
7 # license as circulated by CEA, CNRS and INRIA at the following URL
8 # "http://www.cecill.info".
9 #
10 # As a counterpart to the access to the source code and rights to copy,
11 # modify and redistribute granted by the license, users are provided only
12 # with a limited warranty and the software's author, the holder of the
13 # economic rights, and the successive licensors have only limited
14 # liability.
15 #
16 # In this respect, the user's attention is drawn to the risks associated
17 # with loading, using, modifying and/or developing or reproducing the
18 # software by the user in light of its specific status of free software,
19 # that may mean that it is complicated to manipulate, and that also
20 # therefore means that it is reserved for developers and experienced
21 # professionals having in-depth computer knowledge. Users are therefore
22 # encouraged to load and test the software's suitability as regards their
23 # requirements in conditions enabling the security of their systems and/or
24 # data to be ensured and, more generally, to use and operate it in the
25 # same conditions as regards security.
26 #
27 # The fact that you are presently reading this means that you have had
28 # knowledge of the CeCILL license and that you accept its terms.
29 #
30 import re
31 import sys
32
33 class MySqlTable(object):
34 """
35 Store a table of a mySQL database, used for transcripts or exons
36 Record a a name and a type (int, float, double) for each column
37 @ivar name: name of the table
38 @type name: string
39 @ivar variables: name of the columns
40 @type variables: list of string
41 @ivar types: type of the columns
42 @type types: dict of string
43 @ivar mySqlConnection: connection to a database
44 @type mySqlConnection: class L{MySqlConnection<MySqlConnection>}
45 @ivar nbLines: number of rows
46 @type nbLines: int
47 @ivar verbosity: verbosity
48 @type verbosity: int
49 """
50
51 def __init__(self, connection, name, verbosity = 0):
52 """
53 Constructor
54 Possibly retrieve column names and types if table exists
55 @param mySqlConnection: connection to a databas
56 @type mySqlConnection: class L{MySqlConnection<MySqlConnection>}
57 @param name: name of the table
58 @type name: string
59 @param verbosity: verbosity
60 @type verbosity: int
61 """
62 self.name = name
63 self.variables = []
64 self.types = {}
65 self.sizes = {}
66 self.nbLines = None
67 self.verbosity = verbosity
68 self.mySqlConnection = connection
69 queryTables = self.mySqlConnection.executeQuery("SELECT name FROM sqlite_master WHERE type LIKE 'table' AND name LIKE '%s'" % (self.name))
70 self.created = not queryTables.isEmpty()
71 if self.created:
72 queryFields = self.mySqlConnection.executeQuery("PRAGMA table_info('%s')" % (name))
73 for field in queryFields.getIterator():
74 if field[1] != "id":
75 self.variables.append(field[1])
76 self.types[field[1]] = field[2]
77 self.sizes[field[1]] = field[3]
78
79
80 def getName(self):
81 return self.name
82
83
84 def create(self, variables, types, sizes):
85 """
86 Create a table using give column names and types
87 @param variables: names of the columns
88 @type variables: list of string
89 @param types: types of the columns
90 @type types: dict of string
91 @param sizes: sizes of the types
92 @type sizes: dict of int
93 """
94 self.variables = variables
95 self.types = types
96 self.sizes = sizes
97 if self.created:
98 self.remove()
99 query = "CREATE TABLE '%s' (id INTEGER PRIMARY KEY" % (self.name)
100 for variable in variables:
101 query = "%s, %s %s(%d)" % (query, variable, types[variable], sizes[variable])
102 query += ")"
103 self.mySqlConnection.executeQuery(query)
104 self.created = True
105
106
107 def insertMany(self, lines):
108 """
109 Insert many lines
110 @param lines: the list of values
111 @type lines: list of lists
112 """
113 commands = []
114 for values in lines:
115 commands.append("INSERT INTO '%s' (%s) VALUES (%s)" % (self.name, ", ".join(self.variables), ", ".join([MySqlTable.formatSql(values[variable], self.types[variable], self.sizes[variable]) for variable in self.variables])))
116 self.mySqlConnection.executeManyQueries(commands)
117
118
119 def rename(self, name):
120 """
121 Rename the table
122 @param name: the new name
123 @type name: string
124 """
125 self.mySqlConnection.executeQuery("RENAME TABLE '%s' TO '%s'" % (self.name, name))
126 self.name = name
127
128
129 def copy(self, table):
130 """
131 Copy the given table this one
132 @param table: the table to be copied
133 @type table: class L{MySqlTable<MySqlTable>}
134 """
135 variables = []
136 types = {}
137 sizes = {}
138 fields = self.mySqlConnection.executeQuery("PRAGMA table_info(%s)" % (table.name))
139 for field in fields.getIterator():
140 if field[1] != "id":
141 variables.append(field[1])
142 m = re.search(r"(\w+)\((\d+)\)", field[2])
143 if m == None:
144 raise Exception("\nFormat %s in table %s is strange." % (field[2], table.name))
145 types[field[1]] = m.group(1)
146 sizes[field[1]] = int(m.group(2))
147 self.create(variables, types, sizes)
148 self.mySqlConnection.executeQuery("INSERT INTO '%s' SELECT * FROM %s" % (self.name, table.name))
149
150
151 def add(self, table):
152 """
153 Add the content of a table to this one
154 @param table: the table to be added
155 @type table: class L{MySqlTable<MySqlTable>}
156 """
157 self.mySqlConnection.executeQuery("INSERT INTO '%s' SELECT * FROM %s" % (self.name, table.name))
158 self.created = True
159
160
161 def exists(self):
162 """
163 Check if the table exists in mySQL
164 @return: true if it exits
165 """
166 return self.created
167
168
169 def remove(self):
170 """
171 Remove this table
172 """
173 if self.exists():
174 query = "DROP TABLE IF EXISTS '%s'" % (self.name)
175 self.mySqlConnection.executeQuery(query)
176 self.created = False
177
178
179 def clear(self):
180 """
181 Clear the content of this table
182 """
183 self.mySqlConnection.executeQuery("DELETE FROM '%s'" % (self.name))
184
185
186 def getNbElements(self):
187 """
188 Count the number of rows in the table
189 """
190 command = "SELECT COUNT(id) FROM '%s'" % (self.name)
191 query = self.mySqlConnection.executeQuery(command)
192 return int(query.getLine()[0])
193
194
195 def formatSql(self, value, type, size):
196 """
197 Format a value using MySQL encapsulation
198 """
199 if type.find("int") != -1:
200 return "%d" % value
201 if type.find("float") != -1:
202 return "%.10f" % value
203 if type.find("double") != -1:
204 return "%.20f" % value
205 if type.find("varchar") != -1:
206 if len(value) > size:
207 return "'%s'" % value[0:size]
208 return "'%s'" % value
209 raise Exception("Do not understand type %s" % (type))
210 formatSql = classmethod(formatSql)
211
212
213 def addLine(self, values):
214 """
215 Add a row to this table
216 @param values: the values of the row
217 @type values: dict
218 @return: the id of the added row
219 """
220 sqlValues = []
221 for variable in self.variables:
222 sqlValues.append(self.formatSql(values[variable], self.types[variable], self.sizes[variable]))
223 command = "INSERT INTO '%s' (%s) VALUES (%s)" % (self.name, ", ".join(self.variables), ", ".join(sqlValues))
224 id = self.mySqlConnection.executeQuery(command, True)
225 return id
226
227
228 def retrieveFromId(self, id):
229 """
230 Retrieve a row from its id
231 @param id: the id of the row
232 @type id: int
233 @return: the row
234 """
235 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' WHERE id = %d" % (self.name, id))
236 result = query.getLine()
237 if result == None:
238 raise Exception("Error! Id %d is not in the table %s!" % (id, self.name))
239 return result
240
241
242 def retrieveBulkFromId(self, ids):
243 """
244 Retrieve a row from its id
245 @param id: the ids of the row
246 @type id: list of int
247 @return: the row
248 """
249 if not ids:
250 return []
251 MAXSIZE = 1000
252 results = []
253 for batch in range(len(ids) / MAXSIZE + 1):
254 theseIds = ids[batch * MAXSIZE : (batch+1) * MAXSIZE]
255 if theseIds:
256 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' WHERE id IN (%s)" % (self.name, ", ".join(["%d" % (id) for id in theseIds])))
257 lines = query.getLines()
258 if len(lines) != len(theseIds):
259 raise Exception("Error! Some Ids of (%s) is are missing in the table '%s' (got %d instead of %d)!" % (", ".join(["%d" % (id) for id in theseIds]), self.name, len(lines)), len(theseIds))
260 results.extend(lines)
261 return results
262
263
264 def removeFromId(self, id):
265 """
266 Remove a row from its id
267 @param id: the id of the row
268 @type id: int
269 """
270 self.mySqlConnection.executeQuery("DELETE FROM '%s' WHERE id = %d" % (self.name, id))
271
272
273 def getIterator(self):
274 """
275 Iterate on the content of table
276 @return: iterator to the rows of the table
277 """
278 if not self.created:
279 return
280 MAXSIZE = 1000
281 query = self.mySqlConnection.executeQuery("SELECT count(id) FROM '%s'" % (self.name))
282 nbRows = int(query.getLine()[0])
283 for chunk in range((nbRows / MAXSIZE) + 1):
284 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s' LIMIT %d, %d" % (self.name, chunk * MAXSIZE, MAXSIZE))
285 for line in query.getIterator():
286 yield line
287
288
289 def createIndex(self, indexName, values, unique = False, fullText = False):
290 """
291 Add an index on the table
292 @param indexName: name of the index
293 @type indexName: string
294 @param values: values to be indexed
295 @type values: string
296 @param unique: if the index is unique
297 @type unique: boolean
298 @param fullText: whether full text should be indexed
299 @type fullText: boolean
300 """
301 self.mySqlConnection.executeQuery("CREATE %s%sINDEX '%s' ON '%s' (%s)" % ("UNIQUE " if unique else "", "FULLTEXT " if fullText else "", indexName, self.name, ", ".join(values)))
302
303
304 def setDefaultTagValue(self, field, name, value):
305 """
306 Add a tag value
307 @param name: name of the tag
308 @type name: string
309 @param value: value of the tag
310 @type value: string or int
311 """
312 newData = {}
313 for line in MySqlTable.getIterator(self):
314 id = line[0]
315 tags = line[field]
316 if tags == '':
317 newTag = "%s=%s" % (name, value)
318 else:
319 newTag = "%s;%s=%s" % (tags, name, value)
320 if name not in [tag.split("=")[0] for tag in tags.split(";")]:
321 newData[id] = newTag
322 for id, tag in newData.iteritems():
323 query = self.mySqlConnection.executeQuery("UPDATE '%s' SET tags = '%s' WHERE id = %i" % (self.name, tag, id))
324
325
326
327 def show(self):
328 """
329 Drop the content of the current table
330 """
331 query = self.mySqlConnection.executeQuery("SELECT * FROM '%s'" % (self.name))
332 print query.getLines()
333
334