#!/usr/bin/env python import threading import time from watchdog.observers.polling import PollingObserver from dm.common.utility.loggingManager import LoggingManager from dm.common.utility.configurationManager import ConfigurationManager from dm.common.objects.observedFile import ObservedFile from dm.common.utility.objectUtility import ObjectUtility from dm.common.utility.singleton import Singleton from dm.common.utility.threadingUtility import ThreadingUtility from dm.common.processing.fileProcessingManager import FileProcessingManager from dmFileSystemEventHandler import DmFileSystemEventHandler class FileSystemObserver(threading.Thread,Singleton): CONFIG_SECTION_NAME = 'FileSystemObserver' MIN_FILE_PROCESSING_DELAY_IN_SECONDS_KEY = 'minfileprocessingdelayinseconds' FILE_SYSTEM_EVENT_TIMEOUT_IN_SECONDS_KEY = 'filesystemeventtimeoutinseconds' FILE_SYSTEM_OBSERVER_AGENT_KEY = 'filesystemobserveragent' # Singleton. __instanceLock = threading.RLock() __instance = None def __init__(self): FileSystemObserver.__instanceLock.acquire() try: if FileSystemObserver.__instance: return FileSystemObserver.__instance = self threading.Thread.__init__(self) self.setName('FileSystemObserverThread') self.logger = LoggingManager.getInstance().getLogger(self.__class__.__name__) self.logger.debug('Initializing') self.lock = threading.RLock() self.eventFlag = threading.Event() self.exitFlag = False self.observedFileMap = {} self.__configure() self.fileProcessingManager = FileProcessingManager.getInstance() self.logger.debug('Initialization complete') finally: FileSystemObserver.__instanceLock.release() def __configure(self): cm = ConfigurationManager.getInstance() configItems = cm.getConfigItems(FileSystemObserver.CONFIG_SECTION_NAME) self.logger.debug('Got config items: %s' % configItems) self.minFileProcessingDelayInSeconds = int(cm.getConfigOption(FileSystemObserver.CONFIG_SECTION_NAME, FileSystemObserver.MIN_FILE_PROCESSING_DELAY_IN_SECONDS_KEY)) self.logger.debug('Minimum file processing delay: %s seconds' % self.minFileProcessingDelayInSeconds) self.fileSystemEventTimeoutInSeconds = int(cm.getConfigOption(FileSystemObserver.CONFIG_SECTION_NAME, FileSystemObserver.FILE_SYSTEM_EVENT_TIMEOUT_IN_SECONDS_KEY)) self.logger.debug('File system event timeout: %s seconds' % self.fileSystemEventTimeoutInSeconds) agentClass = cm.getConfigOption(FileSystemObserver.CONFIG_SECTION_NAME, FileSystemObserver.FILE_SYSTEM_OBSERVER_AGENT_KEY) (moduleName,className,constructor) = cm.getModuleClassConstructorTuple(agentClass) self.logger.debug('Creating file system observer agent instance of class %s' % className) self.fileSystemObserverAgent = ObjectUtility.createObjectInstance(moduleName, className, constructor) self.fileSystemObserverAgent.setFileSystemObserver(self) @ThreadingUtility.synchronize def startObservingPath(self, dataDirectory, experiment): self.logger.debug('Agent is starting observer for %s' % dataDirectory) self.fileSystemObserverAgent.startObservingPath(dataDirectory, experiment) @ThreadingUtility.synchronize def stopObservingPath(self, dataDirectory, experiment): self.logger.debug('Agent is stopping observer for %s' % dataDirectory) self.fileSystemObserverAgent.stopObservingPath(dataDirectory, experiment) @ThreadingUtility.synchronize def fileUpdated(self, filePath, dataDirectory, experiment): observedFile = self.observedFileMap.get(filePath, ObservedFile(filePath=filePath, dataDirectory=dataDirectory, experiment=experiment)) observedFile.setLastUpdatedTimestampToNow() self.observedFileMap[filePath] = observedFile self.logger.debug('Observed file updated: %s', observedFile) @ThreadingUtility.synchronize def checkObservedFilesForProcessing(self): now = time.time() filePathsForProcessing = [] for (filePath,observedFile) in self.observedFileMap.items(): timestamp = observedFile.get('lastUpdateTimestamp') deltaT = now - timestamp if deltaT > self.minFileProcessingDelayInSeconds: self.logger.debug('File %s was last modified %s seconds ago, will process it.' % (filePath, deltaT)) filePathsForProcessing.append(filePath) return filePathsForProcessing @ThreadingUtility.synchronize def processFile(self, filePath): self.logger.debug('Processing file %s' % filePath) observedFile = self.observedFileMap.get(filePath) if observedFile is not None: del self.observedFileMap[filePath] self.fileProcessingManager.processFile(observedFile) @ThreadingUtility.synchronize def start(self): self.logger.debug('Starting file observer thread') threading.Thread.start(self) self.logger.debug('Starting file observer agent') self.fileSystemObserverAgent.start() def run(self): self.logger.debug('Starting thread: %s' % self.getName()) while True: if self.exitFlag: self.logger.debug('Exit flag set, %s done' % self.getName()) break try: self.logger.debug('Checking observed files') filePathsForProcessing = self.checkObservedFilesForProcessing() for filePath in filePathsForProcessing: self.processFile(filePath) except Exception, ex: self.logger.exception(ex) self.eventFlag.wait(timeout=self.fileSystemEventTimeoutInSeconds) @ThreadingUtility.synchronize def stop(self): self.logger.debug('Stopping file observer agent') self.fileSystemObserverAgent.stop() self.logger.debug('Stopping file observer thread') self.exitFlag = True self.eventFlag.set() self.logger.debug('Event is set, joining thread') threading.Thread.join(self) self.logger.debug('Module stopped') @ThreadingUtility.synchronize def setEvent(self): self.eventFlag.set() @ThreadingUtility.synchronize def clearEvent(self): self.eventFlag.clear() #################################################################### # Testing if __name__ == '__main__': fp = FileSystemObserver.getInstance() fp.start() time.sleep(30) fp.stop()