aboutsummaryrefslogtreecommitdiffstats
path: root/bin
diff options
context:
space:
mode:
authorbwarsaw <>2003-12-24 17:00:16 +0000
committerbwarsaw <>2003-12-24 17:00:16 +0000
commit11a8c0b2ca3c8a84ce5c1403c02ca634e07f6dee (patch)
tree1eadaa1fa2fc1f08dae3050fc55fd38cbc064751 /bin
parent556bdb0478011df0345cbd3800c825b022e472ab (diff)
downloadmailman2-11a8c0b2ca3c8a84ce5c1403c02ca634e07f6dee.tar.gz
mailman2-11a8c0b2ca3c8a84ce5c1403c02ca634e07f6dee.tar.xz
mailman2-11a8c0b2ca3c8a84ce5c1403c02ca634e07f6dee.zip
Richard Barrett's script to fix Pipermail archive bloat on existing
archives. Closes SF bug #835332.
Diffstat (limited to 'bin')
-rw-r--r--bin/rb-archfix108
1 files changed, 108 insertions, 0 deletions
diff --git a/bin/rb-archfix b/bin/rb-archfix
new file mode 100644
index 00000000..3e200f46
--- /dev/null
+++ b/bin/rb-archfix
@@ -0,0 +1,108 @@
+#! @PYTHON@
+#
+# Copyright (C) 2003 by the Free Software Foundation, Inc.
+#
+# This program is free software; you can redistribute it and/or
+# modify it under the terms of the GNU General Public License
+# as published by the Free Software Foundation; either version 2
+# of the License, or (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
+
+# Author: Richard Barrett
+
+"""Reduce disk space usage for Pipermail archives.
+
+Usage: %(PROGRAM)s [options] file ...
+
+Where options are:
+ -h / --help
+ Print this help message and exit.
+
+Only use this to 'fix' archive -article database files that have been written
+with Mailman 2.1.3 or earlier and have html_body attributes in them. These
+attributes can cause huge amounts of memory bloat and impact performance for
+high activity lists, particularly those where large text postings are made to
+them.
+
+Example:
+
+%% ls -1 archives/private/*/database/*-article | xargs %(PROGRAM)s
+
+You should run `bin/check_perms -f' after running this script.
+
+You will probably want to delete the -article.bak files created by this script
+when you are satisfied with the results.
+
+This script is provided for convenience purposes only. It isn't supported.
+"""
+
+import os
+import sys
+import getopt
+import marshal
+import cPickle as pickle
+
+# Required to get the right classes for unpickling
+import paths
+from Mailman.i18n import _
+
+PROGRAM = sys.argv[0]
+
+
+
+def usage(code, msg=''):
+ if code:
+ fd = sys.stderr
+ else:
+ fd = sys.stdout
+ print >> fd, _(__doc__)
+ if msg:
+ print >> fd, msg
+ sys.exit(code)
+
+
+
+def main():
+ # get command line arguments
+ try:
+ opts, args = getopt.getopt(sys.argv[1:], 'h', ['help'])
+ except getopt.error, msg:
+ usage(1, msg)
+
+ for opt, arg in opts:
+ if opt in ('-h', '--help'):
+ usage(0)
+
+ for filename in args:
+ print 'processing:', filename
+ fp = open(filename, 'rb')
+ d = marshal.load(fp)
+ fp.close()
+ newd = {}
+ for key, pckstr in d.items():
+ article = pickle.loads(pckstr)
+ try:
+ del article.html_body
+ except AttributeError:
+ pass
+ newd[key] = pickle.dumps(article)
+ fp = open(filename + '.tmp', 'wb')
+ marshal.dump(newd, fp)
+ fp.close()
+ os.rename(filename, filename + '.bak')
+ os.rename(filename + '.tmp', filename)
+
+ print 'You should now run "bin/check_perms -f"'
+
+
+
+if __name__ == '__main__':
+ main()