1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
|
#!/usr/bin/python -S
#
# Copyright 2009-2011 Canonical Ltd. This software is licensed under the
# GNU Affero General Public License version 3 (see the file LICENSE).
# pylint: disable-msg=C0103,W0403
"""Librarian garbage collector.
This script is run on the Librarian server to merge duplicate files,
remove expired files from the file system and clean up unreachable
rows in the database.
"""
__metaclass__ = type
import logging
import _pythonpath
from lp.services.config import config
from lp.services.database.lpstorm import IStore
from lp.services.librarian.model import LibraryFileAlias
from lp.services.librarianserver import librariangc
from lp.services.scripts.base import LaunchpadCronScript
class LibrarianGC(LaunchpadCronScript):
def add_my_options(self):
self.parser.add_option(
'', "--skip-duplicates", action="store_true", default=False,
dest="skip_duplicates",
help="Skip duplicate LibraryFileContent merging"
)
self.parser.add_option(
'', "--skip-aliases", action="store_true", default=False,
dest="skip_aliases",
help="Skip unreferenced LibraryFileAlias removal"
)
self.parser.add_option(
'', "--skip-content", action="store_true", default=False,
dest="skip_content",
help="Skip unreferenced LibraryFileContent removal"
)
self.parser.add_option(
'', "--skip-blobs", action="store_true", default=False,
dest="skip_blobs",
help="Skip removing expired TemporaryBlobStorage rows"
)
self.parser.add_option(
'', "--skip-files", action="store_true", default=False,
dest="skip_files",
help="Skip removing files on disk with no database references"
" or flagged for deletion."
)
self.parser.add_option(
'', "--skip-expiry", action="store_true", default=False,
dest="skip_expiry",
help="Skip expiring aliases with an expiry date in the past."
)
def main(self):
librariangc.log = self.logger
if self.options.loglevel <= logging.DEBUG:
librariangc.debug = True
# XXX wgrant 2011-09-18 bug=853066: Using Storm's raw connection
# here is wrong. We should either create our own or use
# Store.execute or cursor() and the transaction module.
conn = IStore(LibraryFileAlias)._connection._raw_connection
# Refuse to run if we have significant clock skew between the
# librarian and the database.
librariangc.confirm_no_clock_skew(conn)
# Note that each of these next steps will issue commit commands
# as appropriate to make this script transaction friendly
if not self.options.skip_expiry:
librariangc.expire_aliases(conn)
if not self.options.skip_content:
# First sweep.
librariangc.delete_unreferenced_content(conn)
if not self.options.skip_blobs:
librariangc.delete_expired_blobs(conn)
if not self.options.skip_duplicates:
librariangc.merge_duplicates(conn)
if not self.options.skip_aliases:
librariangc.delete_unreferenced_aliases(conn)
if not self.options.skip_content:
# Second sweep.
librariangc.delete_unreferenced_content(conn)
if not self.options.skip_files:
librariangc.delete_unwanted_files(conn)
if __name__ == '__main__':
script = LibrarianGC('librarian-gc',
dbuser=config.librarian_gc.dbuser)
script.lock_and_run(isolation='autocommit')
|