# free_disk.py (2.8 KB)

  1. import argparse
  2. import datetime
  3. import logging
  4. import os
  5. import shutil
  6. import re
  7. # https://en.wikipedia.org/wiki/Template:Quantities_of_bytes
  8. DATA_SIZE_UNIT_BYTE_CONVERSION_FACTOR = {
  9. 'B': 1,
  10. 'kB': 10**3,
  11. 'KB': 10**3,
  12. 'MB': 10**6,
  13. 'GB': 10**9,
  14. 'TB': 10**12,
  15. 'KiB': 2**10,
  16. 'MiB': 2**20,
  17. 'GiB': 2**30,
  18. 'TiB': 2**40,
  19. }
  20. def data_size_to_bytes(size_with_unit: str) -> int:
  21. match = re.match(r'^([\d\.]+)\s*([A-Za-z]+)?$', size_with_unit)
  22. if not match:
  23. raise ValueError('Unable to parse data size {!r}'.format(size_with_unit))
  24. unit_symbol = match.group(2)
  25. if unit_symbol:
  26. try:
  27. byte_conversion_factor = DATA_SIZE_UNIT_BYTE_CONVERSION_FACTOR[unit_symbol]
  28. except KeyError:
  29. raise ValueError('Unknown data size unit symbol {!r}'.format(unit_symbol))
  30. else:
  31. byte_conversion_factor = 1
  32. byte_size = float(match.group(1)) * byte_conversion_factor
  33. return int(round(byte_size, 0))
  34. def main():
  35. argparser = argparse.ArgumentParser(
  36. description='Delete files with earliest modification date'
  37. ' until a minimum of --free-bytes are available on the respective disk')
  38. argparser.add_argument('-d', '--debug', action='store_true')
  39. argparser.add_argument('--free-bytes', type=data_size_to_bytes, required=True,
  40. help='examples: 1024, 1024B, 4KiB, 4KB, 2TB')
  41. argparser.add_argument('root_dir_path', metavar='ROOT_DIR')
  42. args = argparser.parse_args()
  43. logging.basicConfig(level=logging.DEBUG if args.debug else logging.INFO,
  44. format='%(asctime)s:%(levelname)s:%(message)s',
  45. datefmt='%Y-%m-%dT%H:%M:%S%z')
  46. logging.debug('Required free bytes: %d', args.free_bytes)
  47. disk_usage = shutil.disk_usage(args.root_dir_path)
  48. logging.debug(disk_usage)
  49. if disk_usage.free >= args.free_bytes:
  50. logging.debug('Requirement already fulfilled')
  51. return
  52. file_paths = [os.path.join(dirpath, filename)
  53. for dirpath, _, filenames in os.walk(args.root_dir_path)
  54. for filename in filenames]
  55. file_mtime_paths = [(os.stat(p).st_mtime, p) for p in file_paths]
  56. file_mtime_paths.sort()
  57. removed_files_counter = 0
  58. last_mtime = None
  59. for file_mtime, file_path in file_mtime_paths:
  60. if shutil.disk_usage(args.root_dir_path).free >= args.free_bytes:
  61. break
  62. os.remove(file_path)
  63. logging.debug('Removed file %s', file_path)
  64. removed_files_counter += 1
  65. last_mtime = file_mtime
  66. if removed_files_counter == 0:
  67. logging.warning('No files to remove')
  68. else:
  69. logging.info('Removed %d file(s) with modification date <= %s', removed_files_counter,
  70. datetime.datetime.utcfromtimestamp(last_mtime).isoformat('T'))
# Run the cleanup only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == '__main__':
    main()