Clone directory (recursive) and restore any changes made to it.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

115 lines
3.7 KiB

  1. #!/usr/bin/env python3
  2. import os
  3. import logging
  4. import string
  5. import hashlib
  6. import time
  7. import shutil
  8. class Cloner:
  9. def __init__(self, targetDir: str, backupDir: str):
  10. self.targetDir = targetDir
  11. self.backupDir = backupDir
  12. self.interval = 1
  13. def handleDir(self, dirPath: str):
  14. backupDirPath = dirPath.replace(self.targetDir, self.backupDir)
  15. if not os.path.isdir(backupDirPath):
  16. os.mkdir(backupDirPath)
  17. with os.scandir(dirPath) as it:
  18. for entry in it:
  19. if entry.is_dir():
  20. self.handleDir(entry.path)
  21. elif entry.is_file():
  22. self.handleFile(entry.path)
  23. def handleFile(self, targetFileName: str):
  24. cloneFileName = targetFileName.replace(self.targetDir, self.backupDir)
  25. cloneHashFileName = cloneFileName + '.md5'
  26. if os.path.exists(cloneFileName):
  27. with open(cloneHashFileName, 'r') as cloneHashFile, open(targetFileName, 'rb') as targetFile:
  28. cloneHashFileContent = cloneHashFile.read()
  29. targetFileContent = targetFile.read()
  30. realHash = hashlib.md5(targetFileContent).hexdigest()
  31. if realHash != cloneHashFileContent:
  32. shutil.copyfile(cloneFileName, targetFileName)
  33. logging.warning(
  34. '{file} failed check, restoring...'.format(file=targetFileName))
  35. else:
  36. logging.info('{file} is fine'.format(file=targetFileName))
  37. else:
  38. logging.warning(
  39. '{file} is a new file, added to backup dir'.format(file=targetFileName))
  40. shutil.copyfile(targetFileName, cloneFileName)
  41. with open(cloneHashFileName, 'w') as cloneHashFile, open(targetFileName, 'rb') as targetFile:
  42. targetFileContent = targetFile.read()
  43. cloneHashFile.write(hashlib.md5(targetFileContent).hexdigest())
  44. def setLog(self, logFileName: str):
  45. logFormatter = logging.Formatter(
  46. fmt="[%(asctime)s][%(levelname)s] %(message)s",
  47. datefmt='%d-%b-%y %H:%M:%S')
  48. rootLogger = logging.getLogger()
  49. fileHandler = logging.FileHandler(logFileName, mode='a')
  50. fileHandler.setFormatter(logFormatter)
  51. rootLogger.addHandler(fileHandler)
  52. # # uncomment this to enable console logging
  53. # consoleHandler = logging.StreamHandler()
  54. # consoleHandler.setFormatter(logFormatter)
  55. # rootLogger.addHandler(consoleHandler)
  56. rootLogger.setLevel(logging.WARNING)
  57. def setInterval(self, interval: int):
  58. self.interval = interval
  59. def start(self):
  60. while True:
  61. self.handleDir(self.targetDir)
  62. time.sleep(5)
  63. if __name__ == "__main__":
  64. import argparse
  65. parser = argparse.ArgumentParser()
  66. parser.add_argument(
  67. '--target',
  68. metavar='PATH',
  69. type=str,
  70. required=True,
  71. help='directory to clone and monitor')
  72. parser.add_argument(
  73. '--backup',
  74. metavar='PATH',
  75. type=str,
  76. required=True,
  77. help='backup directory to store clone'
  78. )
  79. parser.add_argument(
  80. '--interval',
  81. metavar='SECOND',
  82. type=int,
  83. default=1,
  84. help='interval in second(s) which the scripts run, default is 1'
  85. )
  86. parser.add_argument(
  87. '--log',
  88. metavar='LOGFILE',
  89. type=str,
  90. default='/var/log/py-dir-watcher/log.txt',
  91. help='specify custom logfile target, default is \'/var/log/py-dir-watcher/log.txt\' '
  92. )
  93. args = parser.parse_args()
  94. app = Cloner(args.target, args.backup)
  95. app.setLog(args.log)
  96. app.setInterval(args.interval)
  97. app.start()