#!/usr/bin/env python # # Erases the text of every file in a BDB repository # import sys, os import skel, svnfs def main(): if len(sys.argv) == 2: dbhome = os.path.join(sys.argv[1], 'db') for i in ('', 'uuids', 'revisions', 'transactions', 'representations', 'strings', 'changes', 'copies', 'nodes'): if not os.path.exists(os.path.join(dbhome, i)): sys.stderr.write("%s: '%s' is not a valid bdb svn repository\n" % (sys.argv[0], sys.argv[1])) sys.exit(1) else: sys.stderr.write("Usage: %s \n" % sys.argv[0]) sys.exit(1) print("WARNING!: This program will destroy all text data in the subversion") print("repository '%s'" % sys.argv[1]) print("Do not proceed unless this is a *COPY* of your real repository") print("If this is really what you want to do, " \ "type 'YESERASE' and press Return") confirmation = raw_input("Confirmation string> ") if confirmation != "YESERASE": print("Cancelled - confirmation string not matched") sys.exit(0) print("Opening database environment...") cur = None ctx = svnfs.Ctx(dbhome) try: cur = ctx.nodes_db.cursor() nodecount = 0 newrep = skel.Rep() newrep.str = "empty" empty_fulltext_rep_skel = newrep.unparse() del newrep ctx.strings_db['empty'] = "" rec = cur.first() while rec: if rec[0] != "next-key": if (nodecount % 10000 == 0) and nodecount != 0: print("Processed %d nodes..." % nodecount) nodecount += 1 node = skel.Node(rec[1]) if node.kind == "file": rep = skel.Rep(ctx.reps_db[node.datarep]) if rep.kind == "fulltext": if rep.str in ctx.strings_db: del ctx.strings_db[rep.str] ctx.reps_db[node.datarep] = empty_fulltext_rep_skel else: for w in rep.windows: if w.str in ctx.strings_db: del ctx.strings_db[w.str] ctx.reps_db[node.datarep] = empty_fulltext_rep_skel rec = cur.next() print("Processed %d nodes" % nodecount) finally: if cur: cur.close() ctx.close() print("Done") if __name__ == '__main__': main()