[Zope-Checkins] CVS: StandaloneZODB/ZODB - FileStorage.py:1.88
Jeremy Hylton
jeremy@zope.com
Fri, 29 Mar 2002 18:54:00 -0500
Update of /cvs-repository/StandaloneZODB/ZODB
In directory cvs.zope.org:/tmp/cvs-serv20868
Modified Files:
FileStorage.py
Log Message:
Break up transactionalUndo() into possibly understandable chunks.
transactionalUndo() does argument checking and locking. It calls
_transactional_undo(), which finds the right transaction record. It calls
_txn_undo_write(), which writes the data records.
Add a summary comment above undoLog() that explains how the
transaction_id is created and used.
=== StandaloneZODB/ZODB/FileStorage.py 1.87 => 1.88 ===
return self._file.read(8)
-
def _transactionalUndoRecord(self, oid, pos, serial, pre, version):
"""Get the indo information for a data record
@@ -979,7 +978,6 @@
version, packed non-version data pointer, and current
position. If the pickle is true, then the data pointer must
be 0, but the pickle can be empty *and* the pointer 0.
-
"""
copy=1 # Can we just copy a data pointer
@@ -1035,6 +1033,32 @@
raise UndoError('Some data were modified by a later transaction')
+ # undoLog() returns a description dict that includes an id entry.
+ # The id is opaque to the client, but encodes information that
+ # uniquely identifies a transaction in the storage. The id is a
+ # base64 encoded string, where the components of the string are:
+ # - the transaction id
+ # - the packed file position of the transaction record
+ # - the oid of an object modified by the transaction
+
+ # The file position is sufficient in most cases, but doesn't work
+ # if the id is used after a pack and may not work if used with
+ # replicated storages. If the file position is incorrect, the oid
+ # can be used for a relatively efficient search for the
+ # transaction record. FileStorage keeps an index mapping oids to
+ # file positions, but do notes have a transaction id to file
+ # offset index. The oid index maps to the most recent revision of
+ # the object. Transactional undo must follow back pointers until
+ # it finds the correct transaction record,
+
+ # This approach fails if the transaction record has no data
+ # records. It's not clear if that is possible, but it may be for
+ # commitVersion and abortVersion.
+
+ # The file offset also supports non-transactional undo, which
+ # won't work after a pack and isn't supported by replicated
+ # storages.
+
def undoLog(self, first=0, last=-20, filter=None):
if last < 0:
last = first - last + 1
@@ -1073,28 +1097,6 @@
e = loads(read(el))
except:
pass
- # We now need an encoded id that isn't dependent on file
- # position, because it will break after a pack, and in the
- # face of replication, while the transaction and data records
- # may be identical (as viewed from the storage interface),
- # file positions may be meaningless across replicas.
- #
- # We'd love to just give the tid, but FS makes it expensive to
- # go from tid to transaction record. :( However, if the txn
- # has data records, then we can encode the oid of one of the
- # objects affected by the txn. Then we can use the index to
- # find the current revision of the object, follow a
- # back-pointer to find its most-current txn, and then follow
- # the txns back until we find a match. Seems like the best we
- # can do w/o a persistent tid->filepos mapping.
- #
- # Note: if the txn has no data records, we're screwed. Punt
- # on that for now.
- #
- # Note that we're still encoding the transaction position
- # in the transaction ID in order to support non-transactional
- # undo. This can be removed as soon as non-transactional
- # undo is removed.
next = read(8)
# next is either the redundant txn length - 8, or an oid
if next == tl:
@@ -1134,113 +1136,128 @@
self._lock_acquire()
try:
- # As seen in undoLog() below, transaction_id encodes the tid and
- # possibly the oid of the first object in the transaction record.
- # transaction_id will be of length 16 if there were objects
- # affected by the txn, and 8 if there weren't (e.g. abortVersion()
- # and commitVersion()). In the latter case, we could still find
- # the transaction through an expensive search of the file, but
- # we're punting on that for now.
- transaction_id = base64.decodestring(transaction_id + '\n')
- tid = transaction_id[:8]
- oid = transaction_id[16:]
- if oid == '' or not self._index.has_key(oid):
- # We can't get the position of the transaction easily.
- # Note that there is a position encoded in the
- # transaction_id at [8:16], but it can't be used reliably
- # across multiple file storages and thus breaks
- # transactional integrity.
- raise UndoError, 'Undoing a non-object affecting transaction'
- # Find the file position for the current revision of this object,
- # and search back for the beginning of its transaction record
- pos = self._index[oid]
- ostloc = p64(self._pos)
- here = self._pos + (self._tfile.tell() + self._thl)
- while 1:
- self._file.seek(pos)
- h = self._file.read(DATA_HDR_LEN)
- doid,serial,prev,tpos,vlen,plen = unpack('>8s8s8s8sH8s', h)
- tpos = U64(tpos)
- self._file.seek(tpos)
- # Read transaction id to see if we've got a match
- thistid = self._file.read(8)
- if thistid == tid:
- break # Yeee ha!
- # Keep looking
- pos = U64(prev)
- if not pos:
- # We never found the right transaction
- raise UndoError, 'Invalid undo transaction id'
- # We're sitting at the transaction we want to undo, but let's move
- # the file pointer back to the start of the txn record.
+ return self._transactional_undo(transaction_id)
+ finally:
+ self._lock_release()
+
+ def _transactional_undo(self, transaction_id):
+ # As seen in undoLog() below, transaction_id encodes the tid and
+ # possibly the oid of the first object in the transaction record.
+ # transaction_id will be of length 16 if there were objects
+ # affected by the txn, and 8 if there weren't (e.g. abortVersion()
+ # and commitVersion()). In the latter case, we could still find
+ # the transaction through an expensive search of the file, but
+ # we're punting on that for now.
+ transaction_id = base64.decodestring(transaction_id + '\n')
+ tid = transaction_id[:8]
+ pos = U64(transaction_id[8:16])
+ # XXX
+ oid = transaction_id[16:]
+ if oid == '' or not self._index.has_key(oid):
+ # We can't get the position of the transaction easily.
+ # Note that there is a position encoded in the
+ # transaction_id at [8:16], but it can't be used reliably
+ # across multiple file storages and thus breaks
+ # transactional integrity.
+ raise UndoError, 'Undoing a non-object affecting transaction'
+ # Find the file position for the current revision of this object,
+ # and search back for the beginning of its transaction record
+ pos = self._index[oid]
+ ostloc = p64(self._pos)
+ here = self._pos + (self._tfile.tell() + self._thl)
+ while 1:
+ self._file.seek(pos)
+ h = self._file.read(DATA_HDR_LEN)
+ doid, serial, prev, tpos, vlen, plen = \
+ unpack('>8s8s8s8sH8s', h)
+ tpos = U64(tpos)
self._file.seek(tpos)
- h = self._file.read(TRANS_HDR_LEN)
- if len(h) != TRANS_HDR_LEN or h[:8] != tid:
- raise UndoError, 'Invalid undo transaction id'
- if h[16] == 'u':
- return
- if h[16] != ' ':
- raise UndoError, 'non-undoable transaction'
- tl = U64(h[8:16])
- ul, dl, el = struct.unpack(">HHH", h[17:TRANS_HDR_LEN])
- tend = tpos + tl
- pos = tpos + (TRANS_HDR_LEN + ul + dl + el)
- tindex = {}
- failures = {} # keep track of failures, cause we may succeed later
- failed = failures.has_key
- # Read the data records for this transaction
- while pos < tend:
- self._file.seek(pos)
- h = self._file.read(DATA_HDR_LEN)
- oid, serial, sprev, stloc, vlen, splen = \
- struct.unpack(">8s8s8s8sH8s", h)
- if failed(oid):
- del failures[oid] # second chance!
- plen = U64(splen)
- prev = U64(sprev)
- if vlen:
- dlen = DATA_VERSION_HDR_LEN + vlen + (plen or 8)
- self._file.seek(16, 1)
- version = self._file.read(vlen)
+ # Read transaction id to see if we've got a match
+ thistid = self._file.read(8)
+ if thistid == tid:
+ break # Yeee ha!
+ # Keep looking
+ pos = U64(prev)
+ if not pos:
+ # We never found the right transaction
+ raise UndoError('Invalid undo transaction id')
+ # We're sitting at the transaction we want to undo, but let's move
+ # the file pointer back to the start of the txn record.
+ tindex = self._txn_undo_write(tpos, tid, ostloc, here)
+ self._tindex.update(tindex)
+ return tindex.keys()
+
+ def _txn_undo_write(self, tpos, tid, ostloc, here):
+ # a helper function to write the data records for transactional undo
+ self._file.seek(tpos)
+ h = self._file.read(TRANS_HDR_LEN)
+ # XXX jer: don't think the second test is needed at this point
+ if len(h) != TRANS_HDR_LEN or h[:8] != tid:
+ raise UndoError('Invalid undo transaction id')
+ if h[16] == 'u':
+ return
+ if h[16] != ' ':
+ raise UndoError('non-undoable transaction')
+ tl = U64(h[8:16])
+ ul, dl, el = struct.unpack(">HHH", h[17:TRANS_HDR_LEN])
+ tend = tpos + tl
+ pos = tpos + (TRANS_HDR_LEN + ul + dl + el)
+ tindex = {}
+ failures = {} # keep track of failures, cause we may succeed later
+ failed = failures.has_key
+ # Read the data records for this transaction
+ while pos < tend:
+ self._file.seek(pos)
+ h = self._file.read(DATA_HDR_LEN)
+ oid, serial, sprev, stloc, vlen, splen = \
+ struct.unpack(">8s8s8s8sH8s", h)
+ if failed(oid):
+ del failures[oid] # second chance!
+ plen = U64(splen)
+ prev = U64(sprev)
+ if vlen:
+ dlen = DATA_VERSION_HDR_LEN + vlen + (plen or 8)
+ self._file.seek(16, 1)
+ version = self._file.read(vlen)
+ else:
+ dlen = DATA_HDR_LEN + (plen or 8)
+ version = ''
+
+ try:
+ p, prev, v, snv, ipos = self._transactionalUndoRecord(
+ oid, pos, serial, prev, version)
+ except UndoError, v:
+ # Don't fail right away. We may be redeemed later!
+ failures[oid] = v
+ else:
+ plen =len(p)
+ self._tfile.write(pack(">8s8s8s8sH8s",
+ oid, self._serial, p64(ipos),
+ ostloc, len(v), p64(plen)))
+ if v:
+ vprev=self._tvindex.get(v, 0) or self._vindex.get(v, 0)
+ self._tfile.write(snv + p64(vprev) + v)
+ self._tvindex[v] = here
+ odlen = DATA_VERSION_HDR_LEN + len(v)+(plen or 8)
else:
- dlen = DATA_HDR_LEN + (plen or 8)
- version = ''
+ odlen = DATA_HDR_LEN+(plen or 8)
- try:
- p, prev, v, snv, ipos = self._transactionalUndoRecord(
- oid, pos, serial, prev, version)
- except UndoError, v:
- # Don't fail right away. We may be redeemed later!
- failures[oid] = v
+ if p:
+ self._tfile.write(p)
else:
- plen =len(p)
- self._tfile.write(pack(">8s8s8s8sH8s",
- oid, self._serial, p64(ipos),
- ostloc, len(v), p64(plen)))
- if v:
- vprev=self._tvindex.get(v, 0) or self._vindex.get(v, 0)
- self._tfile.write(snv + p64(vprev) + v)
- self._tvindex[v]=here
- odlen = DATA_VERSION_HDR_LEN + len(v)+(plen or 8)
- else:
- odlen = DATA_HDR_LEN+(plen or 8)
-
- if p:
- self._tfile.write(p)
- else:
- self._tfile.write(p64(prev))
- tindex[oid]=here
- here=here+odlen
-
- pos=pos+dlen
- if pos > tend:
- raise UndoError, 'non-undoable transaction'
-
- if failures: raise UndoError(failures)
- self._tindex.update(tindex)
- return tindex.keys()
+ self._tfile.write(p64(prev))
+ tindex[oid] = here
+ here += odlen
- finally: self._lock_release()
+ pos=pos+dlen
+ if pos > tend:
+ raise UndoError, 'non-undoable transaction'
+
+ if failures:
+ raise UndoError(failures)
+
+ return tindex
+
def versionEmpty(self, version):
if not version: