1 | #-----------------------------------------------------------------------
|
---|
2 | #
|
---|
3 | # Copyright (C) 2000, 2001 by Autonomous Zone Industries
|
---|
4 | # Copyright (C) 2002 Gregory P. Smith
|
---|
5 | #
|
---|
6 | # License: This is free software. You may use this software for any
|
---|
7 | # purpose including modification/redistribution, so long as
|
---|
8 | # this header remains intact and that you do not claim any
|
---|
9 | # rights of ownership or authorship of this software. This
|
---|
10 | # software has been tested, but no warranty is expressed or
|
---|
11 | # implied.
|
---|
12 | #
|
---|
13 | # -- Gregory P. Smith <greg@electricrain.com>
|
---|
14 |
|
---|
15 | # This provides a simple database table interface built on top of
|
---|
16 | # the Python BerkeleyDB 3 interface.
|
---|
17 | #
|
---|
18 | _cvsid = '$Id: dbtables.py 46858 2006-06-11 08:35:14Z neal.norwitz $'
|
---|
19 |
|
---|
20 | import re
|
---|
21 | import sys
|
---|
22 | import copy
|
---|
23 | import xdrlib
|
---|
24 | import random
|
---|
25 | from types import ListType, StringType
|
---|
26 | import cPickle as pickle
|
---|
27 |
|
---|
28 | try:
|
---|
29 | # For Pythons w/distutils pybsddb
|
---|
30 | from bsddb3.db import *
|
---|
31 | except ImportError:
|
---|
32 | # For Python 2.3
|
---|
33 | from bsddb.db import *
|
---|
34 |
|
---|
35 | # XXX(nnorwitz): is this correct? DBIncompleteError is conditional in _bsddb.c
|
---|
36 | try:
|
---|
37 | DBIncompleteError
|
---|
38 | except NameError:
|
---|
39 | class DBIncompleteError(Exception):
|
---|
40 | pass
|
---|
41 |
|
---|
42 | class TableDBError(StandardError):
|
---|
43 | pass
|
---|
44 | class TableAlreadyExists(TableDBError):
|
---|
45 | pass
|
---|
46 |
|
---|
47 |
|
---|
48 | class Cond:
|
---|
49 | """This condition matches everything"""
|
---|
50 | def __call__(self, s):
|
---|
51 | return 1
|
---|
52 |
|
---|
53 | class ExactCond(Cond):
|
---|
54 | """Acts as an exact match condition function"""
|
---|
55 | def __init__(self, strtomatch):
|
---|
56 | self.strtomatch = strtomatch
|
---|
57 | def __call__(self, s):
|
---|
58 | return s == self.strtomatch
|
---|
59 |
|
---|
60 | class PrefixCond(Cond):
|
---|
61 | """Acts as a condition function for matching a string prefix"""
|
---|
62 | def __init__(self, prefix):
|
---|
63 | self.prefix = prefix
|
---|
64 | def __call__(self, s):
|
---|
65 | return s[:len(self.prefix)] == self.prefix
|
---|
66 |
|
---|
67 | class PostfixCond(Cond):
|
---|
68 | """Acts as a condition function for matching a string postfix"""
|
---|
69 | def __init__(self, postfix):
|
---|
70 | self.postfix = postfix
|
---|
71 | def __call__(self, s):
|
---|
72 | return s[-len(self.postfix):] == self.postfix
|
---|
73 |
|
---|
74 | class LikeCond(Cond):
|
---|
75 | """
|
---|
76 | Acts as a function that will match using an SQL 'LIKE' style
|
---|
77 | string. Case insensitive and % signs are wild cards.
|
---|
78 | This isn't perfect but it should work for the simple common cases.
|
---|
79 | """
|
---|
80 | def __init__(self, likestr, re_flags=re.IGNORECASE):
|
---|
81 | # escape python re characters
|
---|
82 | chars_to_escape = '.*+()[]?'
|
---|
83 | for char in chars_to_escape :
|
---|
84 | likestr = likestr.replace(char, '\\'+char)
|
---|
85 | # convert %s to wildcards
|
---|
86 | self.likestr = likestr.replace('%', '.*')
|
---|
87 | self.re = re.compile('^'+self.likestr+'$', re_flags)
|
---|
88 | def __call__(self, s):
|
---|
89 | return self.re.match(s)
|
---|
90 |
|
---|
91 | #
|
---|
92 | # keys used to store database metadata
|
---|
93 | #
|
---|
94 | _table_names_key = '__TABLE_NAMES__' # list of the tables in this db
|
---|
95 | _columns = '._COLUMNS__' # table_name+this key contains a list of columns
|
---|
96 |
|
---|
97 | def _columns_key(table):
|
---|
98 | return table + _columns
|
---|
99 |
|
---|
100 | #
|
---|
101 | # these keys are found within table sub databases
|
---|
102 | #
|
---|
103 | _data = '._DATA_.' # this+column+this+rowid key contains table data
|
---|
104 | _rowid = '._ROWID_.' # this+rowid+this key contains a unique entry for each
|
---|
105 | # row in the table. (no data is stored)
|
---|
106 | _rowid_str_len = 8 # length in bytes of the unique rowid strings
|
---|
107 |
|
---|
108 | def _data_key(table, col, rowid):
|
---|
109 | return table + _data + col + _data + rowid
|
---|
110 |
|
---|
111 | def _search_col_data_key(table, col):
|
---|
112 | return table + _data + col + _data
|
---|
113 |
|
---|
114 | def _search_all_data_key(table):
|
---|
115 | return table + _data
|
---|
116 |
|
---|
117 | def _rowid_key(table, rowid):
|
---|
118 | return table + _rowid + rowid + _rowid
|
---|
119 |
|
---|
120 | def _search_rowid_key(table):
|
---|
121 | return table + _rowid
|
---|
122 |
|
---|
123 | def contains_metastrings(s) :
|
---|
124 | """Verify that the given string does not contain any
|
---|
125 | metadata strings that might interfere with dbtables database operation.
|
---|
126 | """
|
---|
127 | if (s.find(_table_names_key) >= 0 or
|
---|
128 | s.find(_columns) >= 0 or
|
---|
129 | s.find(_data) >= 0 or
|
---|
130 | s.find(_rowid) >= 0):
|
---|
131 | # Then
|
---|
132 | return 1
|
---|
133 | else:
|
---|
134 | return 0
|
---|
135 |
|
---|
136 |
|
---|
137 | class bsdTableDB :
|
---|
138 | def __init__(self, filename, dbhome, create=0, truncate=0, mode=0600,
|
---|
139 | recover=0, dbflags=0):
|
---|
140 | """bsdTableDB(filename, dbhome, create=0, truncate=0, mode=0600)
|
---|
141 |
|
---|
142 | Open database name in the dbhome BerkeleyDB directory.
|
---|
143 | Use keyword arguments when calling this constructor.
|
---|
144 | """
|
---|
145 | self.db = None
|
---|
146 | myflags = DB_THREAD
|
---|
147 | if create:
|
---|
148 | myflags |= DB_CREATE
|
---|
149 | flagsforenv = (DB_INIT_MPOOL | DB_INIT_LOCK | DB_INIT_LOG |
|
---|
150 | DB_INIT_TXN | dbflags)
|
---|
151 | # DB_AUTO_COMMIT isn't a valid flag for env.open()
|
---|
152 | try:
|
---|
153 | dbflags |= DB_AUTO_COMMIT
|
---|
154 | except AttributeError:
|
---|
155 | pass
|
---|
156 | if recover:
|
---|
157 | flagsforenv = flagsforenv | DB_RECOVER
|
---|
158 | self.env = DBEnv()
|
---|
159 | # enable auto deadlock avoidance
|
---|
160 | self.env.set_lk_detect(DB_LOCK_DEFAULT)
|
---|
161 | self.env.open(dbhome, myflags | flagsforenv)
|
---|
162 | if truncate:
|
---|
163 | myflags |= DB_TRUNCATE
|
---|
164 | self.db = DB(self.env)
|
---|
165 | # this code relies on DBCursor.set* methods to raise exceptions
|
---|
166 | # rather than returning None
|
---|
167 | self.db.set_get_returns_none(1)
|
---|
168 | # allow duplicate entries [warning: be careful w/ metadata]
|
---|
169 | self.db.set_flags(DB_DUP)
|
---|
170 | self.db.open(filename, DB_BTREE, dbflags | myflags, mode)
|
---|
171 | self.dbfilename = filename
|
---|
172 | # Initialize the table names list if this is a new database
|
---|
173 | txn = self.env.txn_begin()
|
---|
174 | try:
|
---|
175 | if not self.db.has_key(_table_names_key, txn):
|
---|
176 | self.db.put(_table_names_key, pickle.dumps([], 1), txn=txn)
|
---|
177 | # Yes, bare except
|
---|
178 | except:
|
---|
179 | txn.abort()
|
---|
180 | raise
|
---|
181 | else:
|
---|
182 | txn.commit()
|
---|
183 | # TODO verify more of the database's metadata?
|
---|
184 | self.__tablecolumns = {}
|
---|
185 |
|
---|
186 | def __del__(self):
|
---|
187 | self.close()
|
---|
188 |
|
---|
189 | def close(self):
|
---|
190 | if self.db is not None:
|
---|
191 | self.db.close()
|
---|
192 | self.db = None
|
---|
193 | if self.env is not None:
|
---|
194 | self.env.close()
|
---|
195 | self.env = None
|
---|
196 |
|
---|
197 | def checkpoint(self, mins=0):
|
---|
198 | try:
|
---|
199 | self.env.txn_checkpoint(mins)
|
---|
200 | except DBIncompleteError:
|
---|
201 | pass
|
---|
202 |
|
---|
203 | def sync(self):
|
---|
204 | try:
|
---|
205 | self.db.sync()
|
---|
206 | except DBIncompleteError:
|
---|
207 | pass
|
---|
208 |
|
---|
209 | def _db_print(self) :
|
---|
210 | """Print the database to stdout for debugging"""
|
---|
211 | print "******** Printing raw database for debugging ********"
|
---|
212 | cur = self.db.cursor()
|
---|
213 | try:
|
---|
214 | key, data = cur.first()
|
---|
215 | while 1:
|
---|
216 | print repr({key: data})
|
---|
217 | next = cur.next()
|
---|
218 | if next:
|
---|
219 | key, data = next
|
---|
220 | else:
|
---|
221 | cur.close()
|
---|
222 | return
|
---|
223 | except DBNotFoundError:
|
---|
224 | cur.close()
|
---|
225 |
|
---|
226 |
|
---|
227 | def CreateTable(self, table, columns):
|
---|
228 | """CreateTable(table, columns) - Create a new table in the database.
|
---|
229 |
|
---|
230 | raises TableDBError if it already exists or for other DB errors.
|
---|
231 | """
|
---|
232 | assert isinstance(columns, ListType)
|
---|
233 | txn = None
|
---|
234 | try:
|
---|
235 | # checking sanity of the table and column names here on
|
---|
236 | # table creation will prevent problems elsewhere.
|
---|
237 | if contains_metastrings(table):
|
---|
238 | raise ValueError(
|
---|
239 | "bad table name: contains reserved metastrings")
|
---|
240 | for column in columns :
|
---|
241 | if contains_metastrings(column):
|
---|
242 | raise ValueError(
|
---|
243 | "bad column name: contains reserved metastrings")
|
---|
244 |
|
---|
245 | columnlist_key = _columns_key(table)
|
---|
246 | if self.db.has_key(columnlist_key):
|
---|
247 | raise TableAlreadyExists, "table already exists"
|
---|
248 |
|
---|
249 | txn = self.env.txn_begin()
|
---|
250 | # store the table's column info
|
---|
251 | self.db.put(columnlist_key, pickle.dumps(columns, 1), txn=txn)
|
---|
252 |
|
---|
253 | # add the table name to the tablelist
|
---|
254 | tablelist = pickle.loads(self.db.get(_table_names_key, txn=txn,
|
---|
255 | flags=DB_RMW))
|
---|
256 | tablelist.append(table)
|
---|
257 | # delete 1st, in case we opened with DB_DUP
|
---|
258 | self.db.delete(_table_names_key, txn)
|
---|
259 | self.db.put(_table_names_key, pickle.dumps(tablelist, 1), txn=txn)
|
---|
260 |
|
---|
261 | txn.commit()
|
---|
262 | txn = None
|
---|
263 | except DBError, dberror:
|
---|
264 | if txn:
|
---|
265 | txn.abort()
|
---|
266 | raise TableDBError, dberror[1]
|
---|
267 |
|
---|
268 |
|
---|
269 | def ListTableColumns(self, table):
|
---|
270 | """Return a list of columns in the given table.
|
---|
271 | [] if the table doesn't exist.
|
---|
272 | """
|
---|
273 | assert isinstance(table, StringType)
|
---|
274 | if contains_metastrings(table):
|
---|
275 | raise ValueError, "bad table name: contains reserved metastrings"
|
---|
276 |
|
---|
277 | columnlist_key = _columns_key(table)
|
---|
278 | if not self.db.has_key(columnlist_key):
|
---|
279 | return []
|
---|
280 | pickledcolumnlist = self.db.get(columnlist_key)
|
---|
281 | if pickledcolumnlist:
|
---|
282 | return pickle.loads(pickledcolumnlist)
|
---|
283 | else:
|
---|
284 | return []
|
---|
285 |
|
---|
286 | def ListTables(self):
|
---|
287 | """Return a list of tables in this database."""
|
---|
288 | pickledtablelist = self.db.get(_table_names_key)
|
---|
289 | if pickledtablelist:
|
---|
290 | return pickle.loads(pickledtablelist)
|
---|
291 | else:
|
---|
292 | return []
|
---|
293 |
|
---|
294 | def CreateOrExtendTable(self, table, columns):
|
---|
295 | """CreateOrExtendTable(table, columns)
|
---|
296 |
|
---|
297 | Create a new table in the database.
|
---|
298 |
|
---|
299 | If a table of this name already exists, extend it to have any
|
---|
300 | additional columns present in the given list as well as
|
---|
301 | all of its current columns.
|
---|
302 | """
|
---|
303 | assert isinstance(columns, ListType)
|
---|
304 | try:
|
---|
305 | self.CreateTable(table, columns)
|
---|
306 | except TableAlreadyExists:
|
---|
307 | # the table already existed, add any new columns
|
---|
308 | txn = None
|
---|
309 | try:
|
---|
310 | columnlist_key = _columns_key(table)
|
---|
311 | txn = self.env.txn_begin()
|
---|
312 |
|
---|
313 | # load the current column list
|
---|
314 | oldcolumnlist = pickle.loads(
|
---|
315 | self.db.get(columnlist_key, txn=txn, flags=DB_RMW))
|
---|
316 | # create a hash table for fast lookups of column names in the
|
---|
317 | # loop below
|
---|
318 | oldcolumnhash = {}
|
---|
319 | for c in oldcolumnlist:
|
---|
320 | oldcolumnhash[c] = c
|
---|
321 |
|
---|
322 | # create a new column list containing both the old and new
|
---|
323 | # column names
|
---|
324 | newcolumnlist = copy.copy(oldcolumnlist)
|
---|
325 | for c in columns:
|
---|
326 | if not oldcolumnhash.has_key(c):
|
---|
327 | newcolumnlist.append(c)
|
---|
328 |
|
---|
329 | # store the table's new extended column list
|
---|
330 | if newcolumnlist != oldcolumnlist :
|
---|
331 | # delete the old one first since we opened with DB_DUP
|
---|
332 | self.db.delete(columnlist_key, txn)
|
---|
333 | self.db.put(columnlist_key,
|
---|
334 | pickle.dumps(newcolumnlist, 1),
|
---|
335 | txn=txn)
|
---|
336 |
|
---|
337 | txn.commit()
|
---|
338 | txn = None
|
---|
339 |
|
---|
340 | self.__load_column_info(table)
|
---|
341 | except DBError, dberror:
|
---|
342 | if txn:
|
---|
343 | txn.abort()
|
---|
344 | raise TableDBError, dberror[1]
|
---|
345 |
|
---|
346 |
|
---|
347 | def __load_column_info(self, table) :
|
---|
348 | """initialize the self.__tablecolumns dict"""
|
---|
349 | # check the column names
|
---|
350 | try:
|
---|
351 | tcolpickles = self.db.get(_columns_key(table))
|
---|
352 | except DBNotFoundError:
|
---|
353 | raise TableDBError, "unknown table: %r" % (table,)
|
---|
354 | if not tcolpickles:
|
---|
355 | raise TableDBError, "unknown table: %r" % (table,)
|
---|
356 | self.__tablecolumns[table] = pickle.loads(tcolpickles)
|
---|
357 |
|
---|
358 | def __new_rowid(self, table, txn) :
|
---|
359 | """Create a new unique row identifier"""
|
---|
360 | unique = 0
|
---|
361 | while not unique:
|
---|
362 | # Generate a random 64-bit row ID string
|
---|
363 | # (note: this code has <64 bits of randomness
|
---|
364 | # but it's plenty for our database id needs!)
|
---|
365 | p = xdrlib.Packer()
|
---|
366 | p.pack_int(int(random.random()*2147483647))
|
---|
367 | p.pack_int(int(random.random()*2147483647))
|
---|
368 | newid = p.get_buffer()
|
---|
369 |
|
---|
370 | # Guarantee uniqueness by adding this key to the database
|
---|
371 | try:
|
---|
372 | self.db.put(_rowid_key(table, newid), None, txn=txn,
|
---|
373 | flags=DB_NOOVERWRITE)
|
---|
374 | except DBKeyExistError:
|
---|
375 | pass
|
---|
376 | else:
|
---|
377 | unique = 1
|
---|
378 |
|
---|
379 | return newid
|
---|
380 |
|
---|
381 |
|
---|
382 | def Insert(self, table, rowdict) :
|
---|
383 | """Insert(table, datadict) - Insert a new row into the table
|
---|
384 | using the keys+values from rowdict as the column values.
|
---|
385 | """
|
---|
386 | txn = None
|
---|
387 | try:
|
---|
388 | if not self.db.has_key(_columns_key(table)):
|
---|
389 | raise TableDBError, "unknown table"
|
---|
390 |
|
---|
391 | # check the validity of each column name
|
---|
392 | if not self.__tablecolumns.has_key(table):
|
---|
393 | self.__load_column_info(table)
|
---|
394 | for column in rowdict.keys() :
|
---|
395 | if not self.__tablecolumns[table].count(column):
|
---|
396 | raise TableDBError, "unknown column: %r" % (column,)
|
---|
397 |
|
---|
398 | # get a unique row identifier for this row
|
---|
399 | txn = self.env.txn_begin()
|
---|
400 | rowid = self.__new_rowid(table, txn=txn)
|
---|
401 |
|
---|
402 | # insert the row values into the table database
|
---|
403 | for column, dataitem in rowdict.items():
|
---|
404 | # store the value
|
---|
405 | self.db.put(_data_key(table, column, rowid), dataitem, txn=txn)
|
---|
406 |
|
---|
407 | txn.commit()
|
---|
408 | txn = None
|
---|
409 |
|
---|
410 | except DBError, dberror:
|
---|
411 | # WIBNI we could just abort the txn and re-raise the exception?
|
---|
412 | # But no, because TableDBError is not related to DBError via
|
---|
413 | # inheritance, so it would be backwards incompatible. Do the next
|
---|
414 | # best thing.
|
---|
415 | info = sys.exc_info()
|
---|
416 | if txn:
|
---|
417 | txn.abort()
|
---|
418 | self.db.delete(_rowid_key(table, rowid))
|
---|
419 | raise TableDBError, dberror[1], info[2]
|
---|
420 |
|
---|
421 |
|
---|
422 | def Modify(self, table, conditions={}, mappings={}):
|
---|
423 | """Modify(table, conditions={}, mappings={}) - Modify items in rows matching 'conditions' using mapping functions in 'mappings'
|
---|
424 |
|
---|
425 | * table - the table name
|
---|
426 | * conditions - a dictionary keyed on column names containing
|
---|
427 | a condition callable expecting the data string as an
|
---|
428 | argument and returning a boolean.
|
---|
429 | * mappings - a dictionary keyed on column names containing a
|
---|
430 | condition callable expecting the data string as an argument and
|
---|
431 | returning the new string for that column.
|
---|
432 | """
|
---|
433 | try:
|
---|
434 | matching_rowids = self.__Select(table, [], conditions)
|
---|
435 |
|
---|
436 | # modify only requested columns
|
---|
437 | columns = mappings.keys()
|
---|
438 | for rowid in matching_rowids.keys():
|
---|
439 | txn = None
|
---|
440 | try:
|
---|
441 | for column in columns:
|
---|
442 | txn = self.env.txn_begin()
|
---|
443 | # modify the requested column
|
---|
444 | try:
|
---|
445 | dataitem = self.db.get(
|
---|
446 | _data_key(table, column, rowid),
|
---|
447 | txn)
|
---|
448 | self.db.delete(
|
---|
449 | _data_key(table, column, rowid),
|
---|
450 | txn)
|
---|
451 | except DBNotFoundError:
|
---|
452 | # XXXXXXX row key somehow didn't exist, assume no
|
---|
453 | # error
|
---|
454 | dataitem = None
|
---|
455 | dataitem = mappings[column](dataitem)
|
---|
456 | if dataitem <> None:
|
---|
457 | self.db.put(
|
---|
458 | _data_key(table, column, rowid),
|
---|
459 | dataitem, txn=txn)
|
---|
460 | txn.commit()
|
---|
461 | txn = None
|
---|
462 |
|
---|
463 | # catch all exceptions here since we call unknown callables
|
---|
464 | except:
|
---|
465 | if txn:
|
---|
466 | txn.abort()
|
---|
467 | raise
|
---|
468 |
|
---|
469 | except DBError, dberror:
|
---|
470 | raise TableDBError, dberror[1]
|
---|
471 |
|
---|
472 | def Delete(self, table, conditions={}):
|
---|
473 | """Delete(table, conditions) - Delete items matching the given
|
---|
474 | conditions from the table.
|
---|
475 |
|
---|
476 | * conditions - a dictionary keyed on column names containing
|
---|
477 | condition functions expecting the data string as an
|
---|
478 | argument and returning a boolean.
|
---|
479 | """
|
---|
480 | try:
|
---|
481 | matching_rowids = self.__Select(table, [], conditions)
|
---|
482 |
|
---|
483 | # delete row data from all columns
|
---|
484 | columns = self.__tablecolumns[table]
|
---|
485 | for rowid in matching_rowids.keys():
|
---|
486 | txn = None
|
---|
487 | try:
|
---|
488 | txn = self.env.txn_begin()
|
---|
489 | for column in columns:
|
---|
490 | # delete the data key
|
---|
491 | try:
|
---|
492 | self.db.delete(_data_key(table, column, rowid),
|
---|
493 | txn)
|
---|
494 | except DBNotFoundError:
|
---|
495 | # XXXXXXX column may not exist, assume no error
|
---|
496 | pass
|
---|
497 |
|
---|
498 | try:
|
---|
499 | self.db.delete(_rowid_key(table, rowid), txn)
|
---|
500 | except DBNotFoundError:
|
---|
501 | # XXXXXXX row key somehow didn't exist, assume no error
|
---|
502 | pass
|
---|
503 | txn.commit()
|
---|
504 | txn = None
|
---|
505 | except DBError, dberror:
|
---|
506 | if txn:
|
---|
507 | txn.abort()
|
---|
508 | raise
|
---|
509 | except DBError, dberror:
|
---|
510 | raise TableDBError, dberror[1]
|
---|
511 |
|
---|
512 |
|
---|
513 | def Select(self, table, columns, conditions={}):
|
---|
514 | """Select(table, columns, conditions) - retrieve specific row data
|
---|
515 | Returns a list of row column->value mapping dictionaries.
|
---|
516 |
|
---|
517 | * columns - a list of which column data to return. If
|
---|
518 | columns is None, all columns will be returned.
|
---|
519 | * conditions - a dictionary keyed on column names
|
---|
520 | containing callable conditions expecting the data string as an
|
---|
521 | argument and returning a boolean.
|
---|
522 | """
|
---|
523 | try:
|
---|
524 | if not self.__tablecolumns.has_key(table):
|
---|
525 | self.__load_column_info(table)
|
---|
526 | if columns is None:
|
---|
527 | columns = self.__tablecolumns[table]
|
---|
528 | matching_rowids = self.__Select(table, columns, conditions)
|
---|
529 | except DBError, dberror:
|
---|
530 | raise TableDBError, dberror[1]
|
---|
531 | # return the matches as a list of dictionaries
|
---|
532 | return matching_rowids.values()
|
---|
533 |
|
---|
534 |
|
---|
535 | def __Select(self, table, columns, conditions):
|
---|
536 | """__Select() - Used to implement Select and Delete (above)
|
---|
537 | Returns a dictionary keyed on rowids containing dicts
|
---|
538 | holding the row data for columns listed in the columns param
|
---|
539 | that match the given conditions.
|
---|
540 | * conditions is a dictionary keyed on column names
|
---|
541 | containing callable conditions expecting the data string as an
|
---|
542 | argument and returning a boolean.
|
---|
543 | """
|
---|
544 | # check the validity of each column name
|
---|
545 | if not self.__tablecolumns.has_key(table):
|
---|
546 | self.__load_column_info(table)
|
---|
547 | if columns is None:
|
---|
548 | columns = self.tablecolumns[table]
|
---|
549 | for column in (columns + conditions.keys()):
|
---|
550 | if not self.__tablecolumns[table].count(column):
|
---|
551 | raise TableDBError, "unknown column: %r" % (column,)
|
---|
552 |
|
---|
553 | # keyed on rows that match so far, containings dicts keyed on
|
---|
554 | # column names containing the data for that row and column.
|
---|
555 | matching_rowids = {}
|
---|
556 | # keys are rowids that do not match
|
---|
557 | rejected_rowids = {}
|
---|
558 |
|
---|
559 | # attempt to sort the conditions in such a way as to minimize full
|
---|
560 | # column lookups
|
---|
561 | def cmp_conditions(atuple, btuple):
|
---|
562 | a = atuple[1]
|
---|
563 | b = btuple[1]
|
---|
564 | if type(a) is type(b):
|
---|
565 | if isinstance(a, PrefixCond) and isinstance(b, PrefixCond):
|
---|
566 | # longest prefix first
|
---|
567 | return cmp(len(b.prefix), len(a.prefix))
|
---|
568 | if isinstance(a, LikeCond) and isinstance(b, LikeCond):
|
---|
569 | # longest likestr first
|
---|
570 | return cmp(len(b.likestr), len(a.likestr))
|
---|
571 | return 0
|
---|
572 | if isinstance(a, ExactCond):
|
---|
573 | return -1
|
---|
574 | if isinstance(b, ExactCond):
|
---|
575 | return 1
|
---|
576 | if isinstance(a, PrefixCond):
|
---|
577 | return -1
|
---|
578 | if isinstance(b, PrefixCond):
|
---|
579 | return 1
|
---|
580 | # leave all unknown condition callables alone as equals
|
---|
581 | return 0
|
---|
582 |
|
---|
583 | conditionlist = conditions.items()
|
---|
584 | conditionlist.sort(cmp_conditions)
|
---|
585 |
|
---|
586 | # Apply conditions to column data to find what we want
|
---|
587 | cur = self.db.cursor()
|
---|
588 | column_num = -1
|
---|
589 | for column, condition in conditionlist:
|
---|
590 | column_num = column_num + 1
|
---|
591 | searchkey = _search_col_data_key(table, column)
|
---|
592 | # speedup: don't linear search columns within loop
|
---|
593 | if column in columns:
|
---|
594 | savethiscolumndata = 1 # save the data for return
|
---|
595 | else:
|
---|
596 | savethiscolumndata = 0 # data only used for selection
|
---|
597 |
|
---|
598 | try:
|
---|
599 | key, data = cur.set_range(searchkey)
|
---|
600 | while key[:len(searchkey)] == searchkey:
|
---|
601 | # extract the rowid from the key
|
---|
602 | rowid = key[-_rowid_str_len:]
|
---|
603 |
|
---|
604 | if not rejected_rowids.has_key(rowid):
|
---|
605 | # if no condition was specified or the condition
|
---|
606 | # succeeds, add row to our match list.
|
---|
607 | if not condition or condition(data):
|
---|
608 | if not matching_rowids.has_key(rowid):
|
---|
609 | matching_rowids[rowid] = {}
|
---|
610 | if savethiscolumndata:
|
---|
611 | matching_rowids[rowid][column] = data
|
---|
612 | else:
|
---|
613 | if matching_rowids.has_key(rowid):
|
---|
614 | del matching_rowids[rowid]
|
---|
615 | rejected_rowids[rowid] = rowid
|
---|
616 |
|
---|
617 | key, data = cur.next()
|
---|
618 |
|
---|
619 | except DBError, dberror:
|
---|
620 | if dberror[0] != DB_NOTFOUND:
|
---|
621 | raise
|
---|
622 | continue
|
---|
623 |
|
---|
624 | cur.close()
|
---|
625 |
|
---|
626 | # we're done selecting rows, garbage collect the reject list
|
---|
627 | del rejected_rowids
|
---|
628 |
|
---|
629 | # extract any remaining desired column data from the
|
---|
630 | # database for the matching rows.
|
---|
631 | if len(columns) > 0:
|
---|
632 | for rowid, rowdata in matching_rowids.items():
|
---|
633 | for column in columns:
|
---|
634 | if rowdata.has_key(column):
|
---|
635 | continue
|
---|
636 | try:
|
---|
637 | rowdata[column] = self.db.get(
|
---|
638 | _data_key(table, column, rowid))
|
---|
639 | except DBError, dberror:
|
---|
640 | if dberror[0] != DB_NOTFOUND:
|
---|
641 | raise
|
---|
642 | rowdata[column] = None
|
---|
643 |
|
---|
644 | # return the matches
|
---|
645 | return matching_rowids
|
---|
646 |
|
---|
647 |
|
---|
648 | def Drop(self, table):
|
---|
649 | """Remove an entire table from the database"""
|
---|
650 | txn = None
|
---|
651 | try:
|
---|
652 | txn = self.env.txn_begin()
|
---|
653 |
|
---|
654 | # delete the column list
|
---|
655 | self.db.delete(_columns_key(table), txn)
|
---|
656 |
|
---|
657 | cur = self.db.cursor(txn)
|
---|
658 |
|
---|
659 | # delete all keys containing this tables column and row info
|
---|
660 | table_key = _search_all_data_key(table)
|
---|
661 | while 1:
|
---|
662 | try:
|
---|
663 | key, data = cur.set_range(table_key)
|
---|
664 | except DBNotFoundError:
|
---|
665 | break
|
---|
666 | # only delete items in this table
|
---|
667 | if key[:len(table_key)] != table_key:
|
---|
668 | break
|
---|
669 | cur.delete()
|
---|
670 |
|
---|
671 | # delete all rowids used by this table
|
---|
672 | table_key = _search_rowid_key(table)
|
---|
673 | while 1:
|
---|
674 | try:
|
---|
675 | key, data = cur.set_range(table_key)
|
---|
676 | except DBNotFoundError:
|
---|
677 | break
|
---|
678 | # only delete items in this table
|
---|
679 | if key[:len(table_key)] != table_key:
|
---|
680 | break
|
---|
681 | cur.delete()
|
---|
682 |
|
---|
683 | cur.close()
|
---|
684 |
|
---|
685 | # delete the tablename from the table name list
|
---|
686 | tablelist = pickle.loads(
|
---|
687 | self.db.get(_table_names_key, txn=txn, flags=DB_RMW))
|
---|
688 | try:
|
---|
689 | tablelist.remove(table)
|
---|
690 | except ValueError:
|
---|
691 | # hmm, it wasn't there, oh well, that's what we want.
|
---|
692 | pass
|
---|
693 | # delete 1st, incase we opened with DB_DUP
|
---|
694 | self.db.delete(_table_names_key, txn)
|
---|
695 | self.db.put(_table_names_key, pickle.dumps(tablelist, 1), txn=txn)
|
---|
696 |
|
---|
697 | txn.commit()
|
---|
698 | txn = None
|
---|
699 |
|
---|
700 | if self.__tablecolumns.has_key(table):
|
---|
701 | del self.__tablecolumns[table]
|
---|
702 |
|
---|
703 | except DBError, dberror:
|
---|
704 | if txn:
|
---|
705 | txn.abort()
|
---|
706 | raise TableDBError, dberror[1]
|
---|