# database.py -- forked from Tribler/dispersy (517 lines, 414 loc, 21 KB)
"""
This module provides basic database functionality and simple version control.
@author: Boudewijn Schoon
@organization: Technical University Delft
@contact: [email protected]
"""
from os import environ
import hashlib
import sqlite3
from .dprint import dprint
from .revision import update_revision_information
from .singleton import Singleton
# 'thread' and 'current_thread' are only used by code that runs in __debug__ mode (assert
# statements and 'if __debug__:' sections), hence they are only imported in that mode
if __debug__:
    import thread
    from threading import current_thread

# query logging is enabled by defining the DISPERSY_DEBUG_DATABASE_QUERIES environment variable,
# its value is not inspected
__DEBUG_QUERIES__ = 'DISPERSY_DEBUG_DATABASE_QUERIES' in environ
if __DEBUG_QUERIES__:
    from random import randint
    from os.path import exists
    from time import time

    # choose a randomly numbered log file, in the current working directory, that does not
    # exist yet
    DB_DEBUG_FILE = "database_queries_%d.txt" % randint(1, 9999999)
    while exists(DB_DEBUG_FILE):
        DB_DEBUG_FILE = "database_queries_%d.txt" % randint(1, 9999999)

# update version information directly from SVN
update_revision_information("$HeadURL$", "$Revision$")
class IgnoreCommits(Exception):
    """
    Raise this exception inside a 'with database:' clause to leave the clause without performing
    the commits that were requested within it.

    with database:
        # all commit statements are delayed until the database.__exit__
        database.commit()
        database.commit()
        # raising IgnoreCommits causes all commits to be ignored
        raise IgnoreCommits()
    """

    def __init__(self):
        # the exception takes no arguments, the message is fixed
        message = "Ignore all commits made within __enter__ and __exit__"
        super(IgnoreCommits, self).__init__(message)
class Database(Singleton):
    """
    Wrapper around one sqlite3 connection and one cursor.

    The class provides:
     - execute, executescript, and executemany with type checks (in __debug__ mode) and optional
       query logging (when the DISPERSY_DEBUG_DATABASE_QUERIES environment variable is defined);
     - deferred commits through the 'with database:' clause, see __enter__ and __exit__;
     - callbacks that are called after each commit;
     - a version hook, check_database, that subclasses must implement.

    In __debug__ mode every call is asserted to be made on the thread that created the instance.
    """

    def __init__(self, file_path):
        """
        Initialize a new Database instance.

        Connects to the database, applies the page_size, journal_mode, and synchronous PRAGMA
        settings, reads the stored database version, and passes it to check_database.

        @param file_path: the path to the database file.
        @type file_path: unicode

        @raise RuntimeError: when the sqlite_master table can not be counted.
        """
        if __debug__:
            assert isinstance(file_path, unicode)
            dprint(file_path)
            self._debug_thread_ident = thread.get_ident()

        self._file_path = file_path
        self._connect(file_path)

        # _commit_callbacks contains a list with functions that are called on each database commit
        self._commit_callbacks = []

        # Database.commit() is enabled when _pending_commits == 0.  Database.commit() is disabled
        # when _pending_commits > 0.  A commit is required when _pending_commits > 1.
        self._pending_commits = 0

        # collect current database configuration
        page_size = int(next(self._cursor.execute(u"PRAGMA page_size"))[0])
        journal_mode = unicode(next(self._cursor.execute(u"PRAGMA journal_mode"))[0]).upper()
        synchronous = unicode(next(self._cursor.execute(u"PRAGMA synchronous"))[0]).upper()
        # temp_store is only used by the disabled temp_store section below
        temp_store = unicode(next(self._cursor.execute(u"PRAGMA temp_store"))[0]).upper()

        #
        # PRAGMA page_size = bytes;
        # http://www.sqlite.org/pragma.html#pragma_page_size
        # Note that changing page_size has no effect unless performed on a new database or followed
        # directly by VACUUM.  Since we do not want the cost of VACUUM every time we load a
        # database, existing databases must be upgraded.
        #
        if __debug__: dprint("PRAGMA page_size = 8192 (previously: ", page_size, ")")
        if page_size < 8192:
            # it is not possible to change page_size when WAL is enabled
            if journal_mode == u"WAL":
                self._cursor.executescript(u"PRAGMA journal_mode = DELETE")
                journal_mode = u"DELETE"
            self._cursor.execute(u"PRAGMA page_size = 8192")
            self._cursor.execute(u"VACUUM")
            page_size = 8192

        #
        # PRAGMA journal_mode = DELETE | TRUNCATE | PERSIST | MEMORY | WAL | OFF
        # http://www.sqlite.org/pragma.html#pragma_journal_mode
        #
        if __debug__: dprint("PRAGMA journal_mode = WAL (previously: ", journal_mode, ")")
        if not journal_mode == u"WAL":
            self._cursor.execute(u"PRAGMA journal_mode = WAL")

        #
        # PRAGMA synchronous = 0 | OFF | 1 | NORMAL | 2 | FULL;
        # http://www.sqlite.org/pragma.html#pragma_synchronous
        #
        if __debug__: dprint("PRAGMA synchronous = NORMAL (previously: ", synchronous, ")")
        if not synchronous in (u"NORMAL", u"1"):
            self._cursor.execute(u"PRAGMA synchronous = NORMAL")

        #
        # PRAGMA temp_store = 0 | DEFAULT | 1 | FILE | 2 | MEMORY;
        # http://www.sqlite.org/pragma.html#pragma_temp_store
        #
        #DISABLED temp_store memory
        # if __debug__: dprint("PRAGMA temp_store = MEMORY (previously: ", temp_store, ")")
        # if not temp_store in (u"MEMORY", u"2"):
        #     self._cursor.execute(u"PRAGMA temp_store = MEMORY")

        # check if the database contains an 'option' table
        try:
            count, = next(self.execute(u"SELECT COUNT(*) FROM sqlite_master WHERE type = 'table' AND name = 'option'"))
        except StopIteration:
            raise RuntimeError("Unable to count the 'option' tables in sqlite_master")

        if count:
            # get version from required 'option' table
            try:
                version, = next(self.execute(u"SELECT value FROM option WHERE key == 'database_version' LIMIT 1"))
            except StopIteration:
                # the 'database_version' key was not found
                version = u"0"
        else:
            # the 'option' table probably hasn't been created yet
            version = u"0"

        # give the subclass a chance to prepare the connection before the version check
        self._init_database()
        self._database_version = self.check_database(version)
        assert isinstance(self._database_version, (int, long)), type(self._database_version)

    def _connect(self, file_path):
        """
        Create self._connection and self._cursor for the database at FILE_PATH.

        Subclasses may override this method to use another sqlite binding.
        """
        self._connection = sqlite3.Connection(file_path)
        # self._connection.setrollbackhook(self._on_rollback)
        self._cursor = self._connection.cursor()

    def _init_database(self):
        """
        Hook that is called by __init__ after the PRAGMA settings are applied and before
        check_database is called.  The default implementation does nothing.
        """
        pass

    @staticmethod
    def _binding_values(bindings):
        """
        Returns the values that will be bound to the placeholders: the dictionary values when
        BINDINGS is a dictionary (named placeholders), otherwise BINDINGS itself.
        """
        if isinstance(bindings, dict):
            return list(bindings.values())
        return bindings

    @property
    def database_version(self):
        """
        The value returned by check_database during __init__.
        """
        return self._database_version

    def file_path(self):
        """
        The database filename including path.

        Note that this is a method, not a property.
        """
        return self._file_path

    def close(self, commit=True):
        """
        Close the cursor and the connection.

        @param commit: when True, Database.commit() is called before closing.
        @type commit: bool
        """
        if commit:
            self.commit()
        self._cursor.close()
        self._connection.close()

    def __enter__(self):
        """
        Enters a no-commit state.  The commit will be performed by __exit__.

        @return: This Database instance
        """
        assert self._debug_thread_ident == thread.get_ident()
        if __debug__: dprint("disabling Database.commit()")
        # max(...) keeps the commits that were already deferred by an enclosing 'with' clause
        self._pending_commits = max(1, self._pending_commits)
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        """
        Leaves a no-commit state.  A commit will be performed if Database.commit() was called while
        in the no-commit state.

        @return: True when the clause ended without exception or with IgnoreCommits (which is
         suppressed).  False for any other exception, causing Python to re-raise it.
        """
        assert self._debug_thread_ident == thread.get_ident()

        # enable Database.commit() again before (possibly) calling it below
        self._pending_commits, pending_commits = 0, self._pending_commits

        if exc_type is None:
            if __debug__: dprint("enabling Database.commit()")
            if pending_commits > 1:
                if __debug__: dprint("performing ", pending_commits - 1, " pending commits")
                self.commit()
            return True

        elif isinstance(exc_value, IgnoreCommits):
            if __debug__: dprint("enabling Database.commit() without committing now")
            return True

        else:
            #Niels 23-01-2013, an exception happened from within the with database block
            #returning False to let Python reraise the exception.
            return False

    @property
    def last_insert_rowid(self):
        """
        The row id of the most recent insert query.
        @rtype: int or long
        """
        assert self._debug_thread_ident == thread.get_ident()
        assert not self._cursor.lastrowid is None, "The last statement was NOT an insert query"
        return self._cursor.lastrowid

    @property
    def changes(self):
        """
        The number of changes that resulted from the most recent query.
        @rtype: int or long
        """
        assert self._debug_thread_ident == thread.get_ident()
        return self._cursor.rowcount
        # return self._connection.changes()

    def execute(self, statement, bindings=()):
        """
        Execute one SQL statement.

        A SQL query must be presented in unicode format.  This is to ensure that no unicode
        exceptions occur when the bindings are merged into the statement.

        Furthermore, the bindings may not contain any strings either.  For a 'string' the unicode
        type must be used.  For a binary string the buffer(...) type must be used.

        The SQL query may contain placeholder entries defined with a '?'.  Each of these
        placeholders will be used to store one value from bindings.  The placeholders are filled by
        sqlite and all proper escaping is done, making this the preferred way of adding variables to
        the SQL query.

        When query logging is enabled, the statement, its bindings, and the output of EXPLAIN
        QUERY PLAN are appended to DB_DEBUG_FILE.

        @param statement: the SQL statement that is to be executed.
        @type statement: unicode

        @param bindings: the values that must be set to the placeholders in statement.
        @type bindings: tuple

        @returns: the result of cursor.execute

        @raise sqlite3.Error: when sqlite fails, the statement is logged before re-raising.
        """
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.execute on the wrong thread (%s %d-%d)"%(current_thread().getName(), self._debug_thread_ident, thread.get_ident())
        assert isinstance(statement, unicode), "The SQL statement must be given in unicode"
        assert isinstance(bindings, (tuple, list, dict, set)), "The bindings must be a tuple, list, dictionary, or set"
        assert not any(isinstance(value, str) for value in self._binding_values(bindings)), "The bindings may not contain a string. \nProvide unicode for TEXT and buffer(...) for BLOB. \nGiven types: %s" % str([type(value) for value in self._binding_values(bindings)])

        try:
            if __debug__: dprint(statement, " <-- ", bindings)
            if not __DEBUG_QUERIES__:
                return self._cursor.execute(statement, bindings)

            # the with statement closes the log file, also when the query raises
            with open(DB_DEBUG_FILE, 'a') as debug_file:
                #Store the query plan with EXPLAIN QUERY PLAN to detect possible optimizations
                debug_bindings = list(bindings)
                for index, binding in enumerate(debug_bindings):
                    if isinstance(binding, buffer):
                        try:
                            # try to show content of buffer, but at most 100 characters
                            debug_bindings[index] = str(binding).encode("HEX")[:100]
                        except Exception:
                            # best effort, the buffer itself is logged instead
                            pass

                debug_file.write('QueryDebug: (%f) %s %s\n' % (time(), statement, str(debug_bindings)))
                for row in self._cursor.execute('EXPLAIN QUERY PLAN '+statement, bindings).fetchall():
                    debug_file.write('%s %s %s\t%s\n' % row)

                result = self._cursor.execute(statement, bindings)
                debug_file.write('QueryDebug: (%f) END\n' % time())
            return result

        except sqlite3.Error:
            dprint(exception=True, level="warning")
            dprint("Filename: ", self._file_path, level="warning")
            dprint(statement, level="warning")
            raise

    def executescript(self, statements):
        """
        Execute one or more SQL statements, given as a single unicode string, using
        cursor.executescript.

        @param statements: the SQL statements that are to be executed.
        @type statements: unicode

        @returns: the result of cursor.executescript

        @raise sqlite3.Error: when sqlite fails, the statements are logged before re-raising.
        """
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.execute on the wrong thread"
        assert isinstance(statements, unicode), "The SQL statement must be given in unicode"

        try:
            if __debug__: dprint(statements)
            if not __DEBUG_QUERIES__:
                return self._cursor.executescript(statements)

            # the with statement closes the log file, also when the script raises
            with open(DB_DEBUG_FILE, 'a') as debug_file:
                debug_file.write('QueryDebug-script: (%f) %s\n' % (time(), statements))
                result = self._cursor.executescript(statements)
                debug_file.write('QueryDebug-script: (%f) END\n' % time())
            return result

        except sqlite3.Error:
            dprint(exception=True, level="warning")
            dprint("Filename: ", self._file_path, level="warning")
            dprint(statements, level="warning")
            raise

    def executemany(self, statement, sequenceofbindings):
        """
        Execute one SQL statement several times.

        All SQL queries must be presented in unicode format.  This is to ensure that no unicode
        exceptions occur when the bindings are merged into the statement.

        Furthermore, the bindings may not contain any strings either.  For a 'string' the unicode
        type must be used.  For a binary string the buffer(...) type must be used.

        The SQL query may contain placeholder entries defined with a '?'.  Each of these
        placeholders will be used to store one value from bindings.  The placeholders are filled by
        sqlite and all proper escaping is done, making this the preferred way of adding variables to
        the SQL query.

        @param statement: the SQL statement that is to be executed.
        @type statement: unicode

        @param sequenceofbindings: a sequence of values that must be set to the placeholders in
         statement.  Each element in sequence is another tuple containing bindings.
        @type sequenceofbindings: list containing tuples

        @returns: the result of cursor.executemany

        @raise sqlite3.Error: when sqlite fails, the statement is logged before re-raising.
        """
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.execute on the wrong thread"
        if __debug__:
            # we allow GeneratorType but must convert it to a list in __debug__ mode since a
            # generator can only iterate once
            from types import GeneratorType
            if isinstance(sequenceofbindings, GeneratorType):
                sequenceofbindings = list(sequenceofbindings)
            assert isinstance(statement, unicode), "The SQL statement must be given in unicode"
            assert isinstance(sequenceofbindings, (tuple, list, set)), "The sequenceofbindings must be a tuple, list, or set"
            assert all(isinstance(x, (tuple, list, dict, set)) for x in sequenceofbindings), "The sequenceofbindings must be a list with tuples, lists, dictionaries, or sets"
            assert not any(isinstance(value, str) for bindings in sequenceofbindings for value in self._binding_values(bindings)), "The bindings may not contain a string. \nProvide unicode for TEXT and buffer(...) for BLOB."

        try:
            if __debug__: dprint(statement)
            if not __DEBUG_QUERIES__:
                return self._cursor.executemany(statement, sequenceofbindings)

            # a list is required to obtain the length and the first element, sets and generators
            # do not support both
            sequenceofbindings = list(sequenceofbindings)

            # the with statement closes the log file, also when the query raises
            with open(DB_DEBUG_FILE, 'a') as debug_file:
                debug_file.write('QueryDebug-executemany: (%f) %s %d times\n' % (time(), statement, len(sequenceofbindings)))
                # the query plan can only be explained when at least one set of bindings exists
                if sequenceofbindings:
                    for row in self._cursor.execute('EXPLAIN QUERY PLAN '+statement, sequenceofbindings[0]).fetchall():
                        debug_file.write('%s %s %s\t%s\n' % row)

                result = self._cursor.executemany(statement, sequenceofbindings)
                debug_file.write('QueryDebug-executemany: (%f) END\n' % time())
            return result

        except sqlite3.Error:
            dprint(exception=True)
            dprint("Filename: ", self._file_path)
            dprint(statement)
            raise

    def commit(self, exiting = False):
        """
        Commit the current transaction, unless commits are deferred by a 'with database:' clause.

        @param exiting: passed to each commit callback as the keyword argument 'exiting'.  May
         not be True while commits are deferred.
        @type exiting: bool

        @return: False when the commit was deferred, otherwise the result of connection.commit().
        """
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.commit on the wrong thread"
        assert not (exiting and self._pending_commits), "No pending commits should be present when exiting"

        if self._pending_commits:
            # inside a 'with database:' clause, __exit__ will perform the commit
            if __debug__: dprint("defer COMMIT")
            self._pending_commits += 1
            return False

        if __debug__: dprint("COMMIT")
        if not __DEBUG_QUERIES__:
            return self._commit_and_notify(exiting)

        # the with statement closes the log file, also when the commit raises
        with open(DB_DEBUG_FILE, 'a') as debug_file:
            debug_file.write('QueryDebug-commit: (%f)\n' % time())
            result = self._commit_and_notify(exiting)
            debug_file.write('QueryDebug-commit: (%f) END\n' % time())
        return result

    def _commit_and_notify(self, exiting):
        """
        Commit on the connection and call every attached commit callback.

        Exceptions raised by a callback are printed in __debug__ mode and otherwise ignored, this
        ensures that the remaining callbacks are still called.
        """
        result = self._connection.commit()
        for callback in self._commit_callbacks:
            try:
                callback(exiting = exiting)
            except Exception:
                if __debug__: dprint(exception=True, stack=True)
        return result

    # def _on_rollback(self):
    #     if __debug__: dprint("ROLLBACK", level="warning")
    #     raise DatabaseRollbackException(1)

    def check_database(self, database_version):
        """
        Check the database and upgrade if required.

        This method is called once for each Database instance to ensure that the database structure
        and version is correct.  Each Database must contain one table of the structure below where
        the database_version is stored.  This value is used to keep track of the current database
        version.

        >>> CREATE TABLE option(key TEXT PRIMARY KEY, value BLOB);
        >>> INSERT INTO option(key, value) VALUES('database_version', '1');

        @param database_version: the current database_version value from the option table. This
         value reverts to u'0' when the table could not be accessed.
        @type database_version: unicode

        @return: the database version after checking, __init__ asserts that it is an int or long.

        @raise NotImplementedError: always, subclasses must override this method.
        """
        raise NotImplementedError()

    def attach_commit_callback(self, func):
        """
        Register FUNC to be called, with the keyword argument 'exiting', after each commit.
        FUNC may not be registered already.
        """
        assert not func in self._commit_callbacks
        self._commit_callbacks.append(func)

    def detach_commit_callback(self, func):
        """
        Unregister FUNC, which must have been registered with attach_commit_callback.
        """
        assert func in self._commit_callbacks
        self._commit_callbacks.remove(func)
class APSWDatabase(Database):
    """
    Database that uses the apsw binding instead of the sqlite3 module.

    Transactions are managed explicitly: _init_database executes BEGIN and every commit executes
    COMMIT followed by BEGIN.

    The apsw module is imported inside the methods that need it, hence it is only required when
    this class is used.
    """

    def _connect(self, file_path):
        """
        Create self._connection and self._cursor using apsw.
        """
        import apsw
        self._connection = apsw.Connection(file_path)
        self._cursor = self._connection.cursor()

    def _init_database(self):
        """
        Open the first transaction, it is closed and re-opened by each commit.
        """
        # the statement must be unicode to pass the assertions in execute
        self.execute(u"BEGIN")

    def execute(self, statement, bindings=()):
        """
        Execute one SQL statement.

        @param statement: the SQL statement that is to be executed.
        @type statement: unicode

        @param bindings: the values that must be set to the placeholders in statement.  May not
         contain str, use unicode for TEXT and buffer(...) for BLOB.
        @type bindings: tuple, list, or dictionary

        @returns: the result of cursor.execute

        @raise apsw.Error: when apsw fails, in __debug__ mode the statement and bindings are
         logged before re-raising.
        """
        import apsw
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.execute on the wrong thread"
        assert isinstance(statement, unicode), "The SQL statement must be given in unicode"
        assert isinstance(bindings, (tuple, list, dict)), "The bindings must be a tuple, list, or dictionary"
        if __debug__:
            # for a dictionary (named placeholders) the values are bound, not the keys
            values = list(bindings.values()) if isinstance(bindings, dict) else bindings
            assert not any(isinstance(value, str) for value in values), "The bindings may not contain a string. \nProvide unicode for TEXT and buffer(...) for BLOB. \nGiven types: %s" % str([type(value) for value in values])

        try:
            if __debug__: dprint(statement, " <-- ", bindings)
            return self._cursor.execute(statement, bindings)

        except apsw.Error:
            if __debug__:
                dprint(exception=True, level="warning")
                dprint("Filename: ", self._file_path, level="warning")
                dprint(statement, level="warning")
                dprint(bindings, level="warning")
            raise

    def executescript(self, statements):
        """
        Execute one or more SQL statements given as a single unicode string.  The statements are
        passed to execute unchanged.
        """
        return self.execute(statements)

    def executemany(self, statement, sequenceofbindings):
        """
        Execute one SQL statement several times, once for each element in SEQUENCEOFBINDINGS.

        @param statement: the SQL statement that is to be executed.
        @type statement: unicode

        @param sequenceofbindings: a sequence where each element contains the bindings for one
         execution.  The bindings may not contain str, use unicode for TEXT and buffer(...) for
         BLOB.
        @type sequenceofbindings: tuple or list, containing tuples, lists, or dictionaries

        @returns: the result of cursor.executemany

        @raise apsw.Error: when apsw fails, in __debug__ mode the statement is logged before
         re-raising.
        """
        import apsw
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.execute on the wrong thread"
        if __debug__:
            # we allow GeneratorType but must convert it to a list in __debug__ mode since a
            # generator can only iterate once
            from types import GeneratorType
            if isinstance(sequenceofbindings, GeneratorType):
                sequenceofbindings = list(sequenceofbindings)
            assert isinstance(statement, unicode), "The SQL statement must be given in unicode"
            assert isinstance(sequenceofbindings, (tuple, list)), "The sequenceofbindings must be a list with tuples, lists, or dictionaries"
            assert all(isinstance(x, (tuple, list, dict)) for x in sequenceofbindings), "The sequenceofbindings must be a list with tuples, lists, or dictionaries"
            # for a dictionary (named placeholders) the values are bound, not the keys
            assert not any(isinstance(value, str) for bindings in sequenceofbindings for value in (list(bindings.values()) if isinstance(bindings, dict) else bindings)), "The bindings may not contain a string. \nProvide unicode for TEXT and buffer(...) for BLOB."

        try:
            if __debug__: dprint(statement)
            return self._cursor.executemany(statement, sequenceofbindings)

        except apsw.Error:
            if __debug__:
                dprint(exception=True)
                dprint("Filename: ", self._file_path)
                dprint(statement)
            raise

    @property
    def last_insert_rowid(self):
        """
        The row id of the most recent insert query, as reported by the connection.
        @rtype: int or long
        """
        assert self._debug_thread_ident == thread.get_ident()
        # NOTE(review): the cursor.lastrowid assertion of the sqlite3 based Database is not
        # repeated here, apsw cursors do not appear to provide lastrowid -- confirm against the
        # apsw documentation
        return self._connection.last_insert_rowid()

    @property
    def changes(self):
        """
        The number of changes that resulted from the most recent query.
        @rtype: int or long
        """
        assert self._debug_thread_ident == thread.get_ident()
        # changes() concerns the most recent statement, totalchanges() would count every change
        # since the connection was opened
        return self._connection.changes()

    def commit(self, exiting=False):
        """
        Commit the current transaction and open a new one, unless commits are deferred by a
        'with database:' clause.

        @param exiting: passed to each commit callback as the keyword argument 'exiting'.  May
         not be True while commits are deferred.
        @type exiting: bool

        @return: False when the commit was deferred, otherwise the result of execute.
        """
        assert self._debug_thread_ident == thread.get_ident(), "Calling Database.commit on the wrong thread"
        assert not (exiting and self._pending_commits), "No pending commits should be present when exiting"

        if self._pending_commits:
            # inside a 'with database:' clause, __exit__ will perform the commit
            if __debug__: dprint("defer COMMIT")
            self._pending_commits += 1
            return False

        if __debug__: dprint("COMMIT")
        # the statement must be unicode to pass the assertions in execute
        result = self.execute(u"COMMIT;BEGIN")
        for callback in self._commit_callbacks:
            try:
                callback(exiting=exiting)
            except Exception:
                # a failing callback may not prevent the remaining callbacks from being called
                if __debug__: dprint(exception=True, stack=True)
        return result