2012-01-24 13:38:42 +00:00
|
|
|
#!/usr/bin/env python
|
|
|
|
# Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
|
|
|
|
#
|
|
|
|
# Use of this source code is governed by a BSD-style license
|
|
|
|
# that can be found in the LICENSE file in the root of the source
|
|
|
|
# tree. An additional intellectual property rights grant can be found
|
|
|
|
# in the file PATENTS. All contributing project authors may
|
|
|
|
# be found in the AUTHORS file in the root of the source tree.
|
|
|
|
|
2012-04-16 14:41:11 +00:00
|
|
|
__author__ = 'ivinnichenko@webrtc.org (Illya Vinnichenko)'
|
2012-01-24 13:38:42 +00:00
|
|
|
|
2012-02-24 12:12:31 +00:00
|
|
|
"""This script will prune sufficiently old files and empty directories.
|
|
|
|
|
|
|
|
The algorithm is to look into the provided directory and delete any files
|
|
|
|
that is older than x days, recursively. Then all empty directories will be
|
|
|
|
deleted (we can't look at timestamps there since the act of deleting a file
|
|
|
|
will refresh the directory's timestamp).
|
|
|
|
|
|
|
|
Note: This script has only been tested on Linux.
|
|
|
|
"""
|
|
|
|
|
2012-01-24 13:38:42 +00:00
|
|
|
from optparse import OptionParser
|
|
|
|
import os
|
|
|
|
import sys
|
|
|
|
import time
|
|
|
|
|
2012-02-23 12:34:01 +00:00
|
|
|
# The path is considered whitelisted if any of these entries appear
|
2012-01-24 13:38:42 +00:00
|
|
|
# at some point in the path
|
2012-04-16 14:41:11 +00:00
|
|
|
WHITELIST = ['buildbot', 'buildbot.tac', 'Makefile', 'master.cfg',
|
|
|
|
'public_html', 'slaves.cfg', 'state.sqlite', 'twistd.pid']
|
2012-01-24 13:38:42 +00:00
|
|
|
|
|
|
|
|
|
|
|
def is_whitelisted(path):
|
2012-04-16 14:41:11 +00:00
|
|
|
'''Check if file is whitelisted.
|
2012-01-24 13:38:42 +00:00
|
|
|
|
2012-02-24 12:12:31 +00:00
|
|
|
Args:
|
|
|
|
path: file path.
|
2012-04-16 14:41:11 +00:00
|
|
|
'''
|
2012-01-24 13:38:42 +00:00
|
|
|
for entry in WHITELIST:
|
|
|
|
if entry in path:
|
|
|
|
return True
|
|
|
|
return False
|
|
|
|
|
|
|
|
|
2012-02-24 12:12:31 +00:00
|
|
|
def delete_directory(directory):
|
|
|
|
try:
|
|
|
|
os.rmdir(directory)
|
|
|
|
return True
|
|
|
|
except OSError as exception:
|
2012-04-16 14:41:11 +00:00
|
|
|
if 'not empty' in str(exception):
|
2012-03-15 11:03:02 +00:00
|
|
|
# This is normal, ignore it
|
|
|
|
pass
|
|
|
|
else:
|
2012-04-18 09:47:39 +00:00
|
|
|
print >> sys.stderr, ('Could not remove directory %s: reason %s.' %
|
|
|
|
(directory, exception))
|
2012-02-24 12:12:31 +00:00
|
|
|
return False
|
|
|
|
|
|
|
|
|
|
|
|
def delete_file(file):
|
|
|
|
try:
|
|
|
|
os.remove(file)
|
|
|
|
except OSError as exception:
|
2012-04-18 09:47:39 +00:00
|
|
|
print >> sys.stderr, ('Unexpectedly failed to remove file %s: reason %s.' %
|
|
|
|
(file, exception))
|
2012-02-24 12:12:31 +00:00
|
|
|
|
|
|
|
|
|
|
|
def log_removal(file_or_directory, time_stamp, verbose):
|
|
|
|
if verbose:
|
2012-04-16 14:41:11 +00:00
|
|
|
str_stamp = time.strftime('%a, %d %b %Y %H:%M:%S +0000',
|
2012-02-24 12:12:31 +00:00
|
|
|
time.gmtime(time_stamp))
|
2012-04-16 14:41:11 +00:00
|
|
|
print 'Removing [%s], stamped on %s' % (file_or_directory, str_stamp)
|
2012-02-24 12:12:31 +00:00
|
|
|
|
2012-01-24 13:38:42 +00:00
|
|
|
|
2012-02-24 12:12:31 +00:00
|
|
|
def remove_old_files_and_directories(path, num_days, verbose, skip_dirs):
|
2012-04-16 14:41:11 +00:00
|
|
|
'''Removes all files under path that are older than num_days days.
|
2012-02-24 12:12:31 +00:00
|
|
|
The algorithm also tried to delete all directories, except for those who
|
|
|
|
contain files that are sufficiently new.
|
|
|
|
|
|
|
|
Implementation note: it doesn't make sense to look at timestamps for
|
|
|
|
directories since their timestamps are updated when a file is deleted.
|
|
|
|
|
|
|
|
Args:
|
|
|
|
path: The starting point.
|
|
|
|
num_days: days limit for removal.
|
|
|
|
verbose: print every cmd?
|
2012-04-16 14:41:11 +00:00
|
|
|
'''
|
2012-01-24 13:38:42 +00:00
|
|
|
current_time = time.time()
|
2012-02-24 12:12:31 +00:00
|
|
|
limit = 60 * 60 * 24 * num_days
|
|
|
|
|
|
|
|
# Walk bottom-up so directories are deleted in the right order.
|
|
|
|
for root, directories, files in os.walk(path, topdown=False):
|
|
|
|
for file in files:
|
|
|
|
current_file = os.path.join(root, file)
|
|
|
|
time_stamp = os.stat(current_file).st_mtime
|
|
|
|
|
2012-01-24 13:38:42 +00:00
|
|
|
if is_whitelisted(current_file):
|
|
|
|
continue
|
2012-02-24 12:12:31 +00:00
|
|
|
|
2012-01-24 13:38:42 +00:00
|
|
|
if (current_time - time_stamp) > limit:
|
2012-02-24 12:12:31 +00:00
|
|
|
delete_file(current_file)
|
|
|
|
log_removal(current_file, time_stamp, verbose)
|
|
|
|
|
|
|
|
if not skip_dirs:
|
|
|
|
for directory in directories:
|
|
|
|
current_directory = os.path.join(root, directory)
|
|
|
|
time_stamp = os.stat(current_directory).st_mtime
|
|
|
|
if delete_directory(current_directory):
|
|
|
|
log_removal(current_directory, time_stamp, verbose)
|
2012-01-24 13:38:42 +00:00
|
|
|
|
|
|
|
|
|
|
|
def main():
|
2012-04-16 14:41:11 +00:00
|
|
|
usage = 'usage: %prog -p <base path> -n <number of days> [-q] [-d]'
|
2012-01-24 13:38:42 +00:00
|
|
|
parser = OptionParser(usage)
|
2012-04-16 14:41:11 +00:00
|
|
|
parser.add_option('-p', '--path', dest='cleanup_path', help='base directory')
|
|
|
|
parser.add_option('-n', '--num_days', dest='num_days', help='number of days')
|
|
|
|
parser.add_option('-q', '--quiet',
|
|
|
|
action='store_false', dest='verbose', default=True,
|
|
|
|
help='do not print status messages to stdout')
|
|
|
|
parser.add_option('-d', '--delete-dirs-too',
|
|
|
|
action='store_false', dest='skip_dirs', default=True,
|
|
|
|
help='number of days')
|
2012-01-24 13:38:42 +00:00
|
|
|
|
2012-04-18 09:47:39 +00:00
|
|
|
options, unused_args = parser.parse_args()
|
2012-01-24 13:38:42 +00:00
|
|
|
if not options.cleanup_path:
|
2012-04-18 09:47:39 +00:00
|
|
|
sys.exit('You must specify base directory')
|
2012-01-24 13:38:42 +00:00
|
|
|
if not options.num_days:
|
2012-04-18 09:47:39 +00:00
|
|
|
sys.exit('You must specify number of days old')
|
2012-02-24 12:12:31 +00:00
|
|
|
|
|
|
|
if options.verbose:
|
2012-04-16 14:41:11 +00:00
|
|
|
print 'Cleaning up everything in %s older than %s days' % (
|
2012-02-24 12:12:31 +00:00
|
|
|
options.cleanup_path, options.num_days)
|
|
|
|
remove_old_files_and_directories(options.cleanup_path, int(options.num_days),
|
|
|
|
options.verbose, options.skip_dirs)
|
2012-01-24 13:38:42 +00:00
|
|
|
|
2012-04-16 14:41:11 +00:00
|
|
|
if __name__ == '__main__':
|
2012-01-24 13:38:42 +00:00
|
|
|
main()
|