[Zope-Checkins] CVS: ZODB3/ZODB - fsrecover.py:1.11

Jeremy Hylton jeremy@zope.com
Fri, 23 May 2003 13:33:57 -0400


Update of /cvs-repository/ZODB3/ZODB
In directory cvs.zope.org:/tmp/cvs-serv11971/ZODB

Modified Files:
	fsrecover.py 
Log Message:
Fix some serious bugs in fsrecover.

When a corrupted record is found, it guesses a location for the next
good transaction header.  If the guessed location happened to have a
'c' character at just the right spot, it would think it was at the end
of the file.

Fix in off-by-one bug in scan() that lead to failure.

Do more sanity checks for invalid transaction headers following a
scan.

Use restore() instead of store() to copy data.  This change should
maximize the chance that the recovered storage is identical except for
the damaged records.

Add tests from the trunk and remove test in testFileStorage.


=== ZODB3/ZODB/fsrecover.py 1.10 => 1.11 ===
--- ZODB3/ZODB/fsrecover.py:1.10	Fri May  9 11:06:04 2003
+++ ZODB3/ZODB/fsrecover.py	Fri May 23 13:33:56 2003
@@ -11,8 +11,6 @@
 # FOR A PARTICULAR PURPOSE
 #
 ##############################################################################
-
-
 """Simple script for repairing damaged FileStorage files.
 
 Usage: %s [-f] input output
@@ -94,64 +92,92 @@
 def error(mess, *args):
     raise ErrorFound(mess % args)
 
-def read_transaction_header(file, pos, file_size):
+def read_txn_header(f, pos, file_size, outp, ltid):
     # Read the transaction record
-    file.seek(pos)
-    h = file.read(23)
+    f.seek(pos)
+    h = f.read(23)
     if len(h) < 23:
         raise EOFError
 
     tid, stl, status, ul, dl, el = unpack(">8s8scHHH",h)
     if el < 0: el=t32-el
 
-    tl=u64(stl)
-
-    if status=='c': raise EOFError
+    tl = u64(stl)
 
-    if pos+(tl+8) > file_size:
+    if pos + (tl + 8) > file_size:
         error("bad transaction length at %s", pos)
 
-    if status not in ' up':
-        error('invalid status, %s, at %s', status, pos)
+    if tl < (23 + ul + dl + el):
+        error("invalid transaction length, %s, at %s", tl, pos)
+
+    if ltid and tid < ltid:
+        error("time-stamp reducation %s < %s, at %s", u64(tid), u64(ltid), pos)
+
+    if status == "c":
+        truncate(f, pos, file_size, output)
+        raise EOFError
 
-    if tl < (23+ul+dl+el):
-        error('invalid transaction length, %s, at %s', tl, pos)
+    if status not in " up":
+        error("invalid status, %r, at %s", status, pos)
 
-    tpos=pos
-    tend=tpos+tl
+    tpos = pos
+    tend = tpos + tl
 
-    if status=='u':
+    if status == "u":
         # Undone transaction, skip it
-        file.seek(tend)
-        h = file.read(8)
+        f.seek(tend)
+        h = f.read(8)
         if h != stl:
-            error('inconsistent transaction length at %s', pos)
+            error("inconsistent transaction length at %s", pos)
         pos = tend + 8
-        return pos, None
+        return pos, None, tid
 
     pos = tpos+(23+ul+dl+el)
-    user = file.read(ul)
-    description = file.read(dl)
+    user = f.read(ul)
+    description = f.read(dl)
     if el:
-        try: e=loads(file.read(el))
+        try: e=loads(f.read(el))
         except: e={}
     else: e={}
 
     result = RecordIterator(tid, status, user, description, e, pos, tend,
-                            file, tpos)
-    pos=tend
+                            f, tpos)
+    pos = tend
 
     # Read the (intentionally redundant) transaction length
-    file.seek(pos)
-    h = file.read(8)
+    f.seek(pos)
+    h = f.read(8)
     if h != stl:
         error("redundant transaction length check failed at %s", pos)
     pos += 8
 
-    return pos, result
+    return pos, result, tid
+
+def truncate(f, pos, file_size, outp):
+    """Copy data from pos to end of f to a .trNNN file."""
+
+    i = 0
+    while 1:
+        trname = outp + ".tr%d" % i
+        if os.path.exists(trname):
+            i += 1
+    tr = open(trname, "wb")
+    copy(f, tr, file_size - pos)
+    f.seek(pos)
+    tr.close()
+
+def copy(src, dst, n):
+    while n:
+        buf = src.read(8096)
+        if not buf:
+            break
+        if len(buf) > n:
+            buf = buf[:n]
+        dst.write(buf)
+        n -= len(buf)
 
-def scan(file, pos):
-    """Return a potential transaction location following pos in file.
+def scan(f, pos):
+    """Return a potential transaction location following pos in f.
 
     This routine scans forward from pos looking for the last data
     record in a transaction.  A period '.' always occurs at the end of
@@ -163,30 +189,30 @@
     actually a transaction header.
     """
     while 1:
-        file.seek(pos)
-        data = file.read(8096)
+        f.seek(pos)
+        data = f.read(8096)
         if not data:
             return 0
 
         s = 0
         while 1:
-            l = data.find('.', s)
+            l = data.find(".", s)
             if l < 0:
                 pos += len(data)
                 break
             # If we are less than 8 bytes from the end of the
             # string, we need to read more data.
-            if l > len(data) - 8:
+            s = l + 1
+            if s > len(data) - 8:
                 pos += l
                 break
-            s = l + 1
             tl = u64(data[s:s+8])
             if tl < pos:
                 return pos + s + 8
 
 def iprogress(i):
     if i % 2:
-        print '.',
+        print ".",
     else:
         print (i/2) % 10,
     sys.stdout.flush()
@@ -197,7 +223,7 @@
 
 def main():
     try:
-        opts, (inp, outp) = getopt.getopt(sys.argv[1:], 'fv:pP:')
+        opts, (inp, outp) = getopt.getopt(sys.argv[1:], "fv:pP:")
     except getopt.error:
         die()
         print __doc__ % argv[0]
@@ -205,58 +231,63 @@
     force = partial = verbose = 0
     pack = None
     for opt, v in opts:
-        if opt == '-v':
+        if opt == "-v":
             verbose = int(v)
-        elif opt == '-p':
+        elif opt == "-p":
             partial = 1
-        elif opt == '-f':
+        elif opt == "-f":
             force = 1
-        elif opt == '-P':
+        elif opt == "-P":
             pack = time.time() - float(v)
 
     recover(inp, outp, verbose, partial, force, pack)
 
 def recover(inp, outp, verbose=0, partial=0, force=0, pack=0):
-    print 'Recovering', inp, 'into', outp
+    print "Recovering", inp, "into", outp
 
     if os.path.exists(outp) and not force:
         die("%s exists" % outp)
 
-    file = open(inp, "rb")
-    if file.read(4) != ZODB.FileStorage.packed_version:
+    f = open(inp, "rb")
+    if f.read(4) != ZODB.FileStorage.packed_version:
         die("input is not a file storage")
 
-    file.seek(0,2)
-    file_size = file.tell()
+    f.seek(0,2)
+    file_size = f.tell()
 
     ofs = ZODB.FileStorage.FileStorage(outp, create=1)
     _ts = None
     ok = 1
     prog1 = 0
-    preindex = {}
     undone = 0
 
     pos = 4
+    ltid = None
     while pos:
         try:
-            npos, transaction = read_transaction_header(file, pos, file_size)
+            npos, txn, tid = read_txn_header(f, pos, file_size, outp, ltid)
         except EOFError:
             break
-        except:
-            print "\n%s: %s\n" % sys.exc_info()[:2]
+        except (KeyboardInterrupt, SystemExit):
+            raise
+        except Exception, err:
+            print "error reading txn header:", err
             if not verbose:
                 progress(prog1)
-            pos = scan(file, pos)
+            pos = scan(f, pos)
+            if verbose > 1:
+                print "looking for valid txn header at", pos
             continue
+        ltid = tid
 
-        if transaction is None:
+        if txn is None:
             undone = undone + npos - pos
             pos = npos
             continue
         else:
             pos = npos
 
-        tid = transaction.tid
+        tid = txn.tid
 
         if _ts is None:
             _ts = TimeStamp(tid)
@@ -264,58 +295,59 @@
             t = TimeStamp(tid)
             if t <= _ts:
                 if ok:
-                    print ('Time stamps out of order %s, %s' % (_ts, t))
+                    print ("Time stamps out of order %s, %s" % (_ts, t))
                 ok = 0
                 _ts = t.laterThan(_ts)
                 tid = `_ts`
             else:
                 _ts = t
                 if not ok:
-                    print ('Time stamps back in order %s' % (t))
+                    print ("Time stamps back in order %s" % (t))
                     ok = 1
 
-        if verbose:
-            print 'begin',
-            if verbose > 1:
-                print
-            sys.stdout.flush()
-
-        ofs.tpc_begin(transaction, tid, transaction.status)
+        ofs.tpc_begin(txn, tid, txn.status)
 
         if verbose:
-            print 'begin', pos, _ts,
+            print "begin", pos, _ts,
             if verbose > 1:
                 print
             sys.stdout.flush()
 
         nrec = 0
         try:
-            for r in transaction:
-                oid = r.oid
+            for r in txn:
                 if verbose > 1:
-                    print u64(oid), r.version, len(r.data)
-                pre = preindex.get(oid)
-                s = ofs.store(oid, pre, r.data, r.version, transaction)
-                preindex[oid] = s
+                    if r.data is None:
+                        l = "bp"
+                    else:
+                        l = len(r.data)
+                        
+                    print "%7d %s %s" % (u64(r.oid), l, r.version)
+                s = ofs.restore(r.oid, r.serial, r.data, r.version,
+                                r.data_txn, txn)
                 nrec += 1
-        except:
+        except (KeyboardInterrupt, SystemExit):
+            raise
+        except Exception, err:
             if partial and nrec:
-                ofs._status = 'p'
-                ofs.tpc_vote(transaction)
-                ofs.tpc_finish(transaction)
+                ofs._status = "p"
+                ofs.tpc_vote(txn)
+                ofs.tpc_finish(txn)
                 if verbose:
-                    print 'partial'
+                    print "partial"
             else:
-                ofs.tpc_abort(transaction)
-            print "\n%s: %s\n" % sys.exc_info()[:2]
+                ofs.tpc_abort(txn)
+            print "error copying transaction:", err
             if not verbose:
                 progress(prog1)
-            pos = scan(file, pos)
+            pos = scan(f, pos)
+            if verbose > 1:
+                print "looking for valid txn header at", pos
         else:
-            ofs.tpc_vote(transaction)
-            ofs.tpc_finish(transaction)
+            ofs.tpc_vote(txn)
+            ofs.tpc_finish(txn)
             if verbose:
-                print 'finish'
+                print "finish"
                 sys.stdout.flush()
 
         if not verbose:
@@ -338,7 +370,6 @@
 
     ofs.close()
 
-
-if __name__ == '__main__':
+if __name__ == "__main__":
     main()