mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 07:48:51 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			158 lines
		
	
	
	
		
			4.4 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			158 lines
		
	
	
	
		
			4.4 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| """A dumb and slow but simple dbm clone.
 | |
| 
 | |
| For database spam, spam.dir contains the index (a text file),
 | |
| spam.bak *may* contain a backup of the index (also a text file),
 | |
| while spam.dat contains the data (a binary file).
 | |
| 
 | |
| XXX TO DO:
 | |
| 
 | |
| - seems to contain a bug when updating...
 | |
| 
 | |
| - reclaim free space (currently, space once occupied by deleted or expanded
 | |
| items is never reused)
 | |
| 
 | |
| - support concurrent access (currently, if two processes take turns making
 | |
| updates, they can mess up the index)
 | |
| 
 | |
| - support efficient access to large databases (currently, the whole index
 | |
| is read when the database is opened, and some updates rewrite the whole index)
 | |
| 
 | |
| - support opening for read-only (flag = 'm')
 | |
| 
 | |
| """
 | |
| 
 | |
| import os as _os
 | |
| import __builtin__
 | |
| 
 | |
| _open = __builtin__.open
 | |
| 
 | |
| _BLOCKSIZE = 512
 | |
| 
 | |
| error = IOError                         # For anydbm
 | |
| 
 | |
class _Database:
    """Dictionary-like store for string keys and values, kept in plain files.

    For a database named ``spam`` three files are used:

    * ``spam.dat`` -- the values, each one starting on a _BLOCKSIZE boundary;
    * ``spam.dir`` -- the index, one ``key, (pos, siz)`` line per entry, where
      a later line for the same key overrides an earlier one;
    * ``spam.bak`` -- the previous index, kept whenever the index is rewritten.

    Space in the data file is never reclaimed.
    """

    def __init__(self, file, mode):
        """Open (creating if necessary) the database whose base name is *file*.

        *mode* is remembered in ``self._mode`` but is not applied to the
        files: the builtin open() has no permission argument (its third
        positional argument is the buffer size).
        """
        self._mode = mode
        # Set before anything can fail so that __del__ on a half-built
        # object finds a consistent "nothing to commit" state.
        self._index = None
        self._dirfile = file + _os.extsep + 'dir'
        self._datfile = file + _os.extsep + 'dat'
        self._bakfile = file + _os.extsep + 'bak'
        # Mod by Jack: create data file if needed
        try:
            f = _open(self._datfile, 'r')
        except IOError:
            f = _open(self._datfile, 'w')
        f.close()
        self._update()

    def _update(self):
        """(Re)load the in-memory index from the directory file.

        A missing or unreadable directory file yields an empty index.
        Reading stops at the first blank line.
        """
        self._index = {}
        try:
            f = _open(self._dirfile)
        except IOError:
            return
        try:
            for line in f:
                line = line.rstrip()
                if not line:
                    break
                # NOTE(security): eval() executes whatever the index file
                # contains.  Only open databases whose files are trusted.
                key, (pos, siz) = eval(line)
                self._index[key] = (pos, siz)
        finally:
            f.close()

    def _commit(self):
        """Rewrite the directory file from the in-memory index.

        The previous directory file is kept as the backup file.  Does
        nothing once the database has been closed, so close() may be
        called repeatedly and __del__ is safe after close().
        """
        if getattr(self, '_index', None) is None:
            return
        # Best effort: the backup or the directory file may not exist yet.
        try:
            _os.unlink(self._bakfile)
        except _os.error:
            pass
        try:
            _os.rename(self._dirfile, self._bakfile)
        except _os.error:
            pass
        f = _open(self._dirfile, 'w')
        try:
            for key, (pos, siz) in self._index.items():
                f.write("%r, (%r, %r)\n" % (key, pos, siz))
        finally:
            f.close()

    def __getitem__(self, key):
        """Return the value stored under *key*; raise KeyError if absent."""
        pos, siz = self._index[key]     # may raise KeyError
        f = _open(self._datfile, 'rb')
        try:
            f.seek(pos)
            return f.read(siz)
        finally:
            f.close()

    def _addval(self, val):
        """Append *val* to the data file on a block boundary.

        Returns the ``(pos, siz)`` pair describing where it was written.
        """
        f = _open(self._datfile, 'rb+')
        try:
            f.seek(0, 2)
            pos = int(f.tell())
            npos = ((pos + _BLOCKSIZE - 1) // _BLOCKSIZE) * _BLOCKSIZE
            # Pad explicitly with NUL bytes instead of seeking past the end
            # of the file; the latter does not work under the MW compiler.
            f.write('\0' * (npos - pos))
            f.write(val)
        finally:
            f.close()
        return (npos, len(val))

    def _setval(self, pos, val):
        """Overwrite the data file at offset *pos* with *val*.

        Returns the ``(pos, siz)`` pair describing the new value.
        """
        f = _open(self._datfile, 'rb+')
        try:
            f.seek(pos)
            f.write(val)
        finally:
            f.close()
        return (pos, len(val))

    def _addkey(self, key, pos_and_siz):
        """Record *key* in the index and append its entry to the directory file.

        *pos_and_siz* is the ``(pos, siz)`` pair returned by _addval() or
        _setval().
        """
        pos, siz = pos_and_siz
        self._index[key] = (pos, siz)
        f = _open(self._dirfile, 'a')
        try:
            f.write("%r, (%r, %r)\n" % (key, pos, siz))
        finally:
            f.close()

    def __setitem__(self, key, val):
        """Store *val* under *key*; both must be strings (else TypeError).

        A new value that needs no more blocks than the old one is written
        in place; otherwise it is appended to the data file and the old
        space is abandoned.
        """
        if not (isinstance(key, str) and isinstance(val, str)):
            raise TypeError("keys and values must be strings")
        if key not in self._index:
            self._addkey(key, self._addval(val))
            return
        pos, siz = self._index[key]
        oldblocks = (siz + _BLOCKSIZE - 1) // _BLOCKSIZE
        newblocks = (len(val) + _BLOCKSIZE - 1) // _BLOCKSIZE
        if newblocks <= oldblocks:
            entry = self._setval(pos, val)
        else:
            entry = self._addval(val)
        if entry != (pos, siz):
            # Append the changed entry so the directory file never describes
            # the old position/size; _update() lets the later line win and
            # _commit() removes the duplicate.
            self._addkey(key, entry)

    def __delitem__(self, key):
        """Remove *key* (KeyError if absent) and rewrite the directory file."""
        del self._index[key]
        self._commit()

    def keys(self):
        """Return the keys currently in the index."""
        return self._index.keys()

    def has_key(self, key):
        """Return true if *key* is in the database."""
        return key in self._index

    def __contains__(self, key):
        """Support ``key in db``."""
        return key in self._index

    def iterkeys(self):
        """Return an iterator over the keys."""
        return iter(self._index)
    __iter__ = iterkeys

    def __len__(self):
        """Return the number of entries."""
        return len(self._index)

    def close(self):
        """Write the index out and mark the database closed.

        Calling close() again is a no-op.
        """
        self._commit()
        self._index = None
        self._datfile = self._dirfile = self._bakfile = None

    def __del__(self):
        """Commit pending index changes if the database was never closed."""
        self._commit()
 | |
| 
 | |
| 
 | |
| 
 | |
| def open(file, flag=None, mode=0666):
 | |
|     # flag, mode arguments are currently ignored
 | |
|     return _Database(file, mode)
 | 
