Source code for sensai.util.logging

import atexit
import logging as lg
import sys
import time
from abc import ABC, abstractmethod
from datetime import datetime
from io import StringIO
from logging import *
from typing import List, Callable, Optional, TypeVar, TYPE_CHECKING, Generic

from .time import format_duration

if TYPE_CHECKING:
    import pandas as pd


log = getLogger(__name__)

LOG_DEFAULT_FORMAT = '%(levelname)-5s %(asctime)-15s %(name)s:%(funcName)s:%(lineno)d - %(message)s'
T = TypeVar("T")
THandler = TypeVar("THandler", bound=Handler)

# Holds the log format that is configured by the user (using function `configure`), such
# that it can be reused in other places
_logFormat = LOG_DEFAULT_FORMAT

# User-configured callback which is called after logging is configured via function `configure`
_configureCallbacks: List[Callable[[], None]] = []


[docs]def remove_log_handlers(): """ Removes all current log handlers """ logger = getLogger() while logger.hasHandlers(): logger.removeHandler(logger.handlers[0])
[docs]def remove_log_handler(handler): getLogger().removeHandler(handler)
[docs]def is_log_handler_active(handler): return handler in getLogger().handlers
[docs]def is_enabled() -> bool: """ :return: True if logging is enabled (at least one log handler exists) """ return getLogger().hasHandlers()
[docs]def set_configure_callback(callback: Callable[[], None], append: bool = True) -> None: """ Configures a function to be called when logging is configured, e.g. through :func:`configure, :func:`run_main` or :func:`run_cli`. A typical use for the callback is to configure the logging behaviour of packages, setting appropriate log levels. :param callback: the function to call :param append: whether to append to the list of callbacks; if False, any existing callbacks will be removed """ global _configureCallbacks if not append: _configureCallbacks = [] _configureCallbacks.append(callback)
# noinspection PyShadowingBuiltins
[docs]def configure(format=LOG_DEFAULT_FORMAT, level=lg.DEBUG): """ Configures logging to stdout with the given format and log level, also configuring the default log levels of some overly verbose libraries as well as some pandas output options. :param format: the log format :param level: the minimum log level """ global _logFormat _logFormat = format remove_log_handlers() basicConfig(level=level, format=format, stream=sys.stdout) getLogger("matplotlib").setLevel(lg.INFO) getLogger("urllib3").setLevel(lg.INFO) getLogger("msal").setLevel(lg.INFO) try: import pandas as pd pd.set_option('display.max_colwidth', 255) except ImportError: pass for callback in _configureCallbacks: callback()
# noinspection PyShadowingBuiltins
[docs]def run_main(main_fn: Callable[..., T], format=LOG_DEFAULT_FORMAT, level=lg.DEBUG) -> T: """ Configures logging with the given parameters, ensuring that any exceptions that occur during the execution of the given function are logged. Logs two additional messages, one before the execution of the function, and one upon its completion. :param main_fn: the function to be executed :param format: the log message format :param level: the minimum log level :return: the result of `main_fn` """ configure(format=format, level=level) log.info("Starting") try: result = main_fn() log.info("Done") return result except Exception as e: log.error("Exception during script execution", exc_info=e)
# noinspection PyShadowingBuiltins
[docs]def run_cli(main_fn: Callable[..., T], format: str = LOG_DEFAULT_FORMAT, level: int = lg.DEBUG) -> Optional[T]: """ Configures logging with the given parameters and runs the given main function as a CLI using `jsonargparse` (which is configured to also parse attribute docstrings, such that dataclasses can be used as function arguments). Using this function requires that `jsonargparse` and `docstring_parser` be available. Like `run_main`, two additional log messages will be logged (at the beginning and end of the execution), and it is ensured that all exceptions will be logged. :param main_fn: the function to be executed :param format: the log message format :param level: the minimum log level :return: the result of `main_fn` """ from jsonargparse import set_docstring_parse_options, CLI set_docstring_parse_options(attribute_docstrings=True) return run_main(lambda: CLI(main_fn), format=format, level=level)
[docs]def datetime_tag() -> str: """ :return: a string tag for use in log file names which contains the current date and time (compact but readable) """ return datetime.now().strftime('%Y%m%d-%H%M%S')
_fileLoggerPaths: List[str] = [] _isAtExitReportFileLoggerRegistered = False def _at_exit_report_file_logger(): for path in _fileLoggerPaths: print(f"A log file was saved to {path}")
[docs]def add_file_logger(path, append=True, register_atexit=True) -> FileHandler: global _isAtExitReportFileLoggerRegistered log.info(f"Logging to {path} ...") mode = "a" if append else "w" handler = FileHandler(path, mode=mode) handler.setFormatter(Formatter(_logFormat)) Logger.root.addHandler(handler) _fileLoggerPaths.append(path) if not _isAtExitReportFileLoggerRegistered and register_atexit: atexit.register(_at_exit_report_file_logger) _isAtExitReportFileLoggerRegistered = True return handler
[docs]class MemoryStreamHandler(StreamHandler): def __init__(self, stream: StringIO): super().__init__(stream)
[docs] def get_log(self) -> str: stream: StringIO = self.stream return stream.getvalue()
[docs]def add_memory_logger() -> MemoryStreamHandler: """ Adds an in-memory logger, i.e. all log statements are written to a memory buffer which can be retrieved using the handler's `get_log` method. """ handler = MemoryStreamHandler(StringIO()) handler.setFormatter(Formatter(_logFormat)) Logger.root.addHandler(handler) return handler
[docs]class StopWatch: """ Represents a stop watch for timing an execution. Constructing an instance starts the stopwatch. """ def __init__(self, start=True): self.start_time = time.time() self._elapsed_secs = 0.0 self.is_running = start
[docs] def reset(self, start=True): """ Resets the stopwatch, setting the elapsed time to zero. :param start: whether to start the stopwatch immediately """ self.start_time = time.time() self._elapsed_secs = 0.0 self.is_running = start
[docs] def restart(self): """ Resets the stopwatch (setting the elapsed time to zero) and restarts it immediately """ self.reset(start=True)
def _get_elapsed_time_since_last_start(self): if self.is_running: return time.time() - self.start_time else: return 0
[docs] def pause(self): """ Pauses the stopwatch. It can be resumed via method 'resume'. """ self._elapsed_secs += self._get_elapsed_time_since_last_start() self.is_running = False
[docs] def resume(self): """ Resumes the stopwatch (assuming that it is currently paused). If the stopwatch is not paused, the method has no effect (and a warning is logged). """ if not self.is_running: self.start_time = time.time() self.is_running = True else: log.warning("Stopwatch is already running (resume has not effect)")
[docs] def get_elapsed_time_secs(self) -> float: """ Gets the total elapsed time, in seconds, on this stopwatch. :return: the elapsed time in seconds """ return self._elapsed_secs + self._get_elapsed_time_since_last_start()
[docs] def get_elapsed_timedelta(self) -> "pd.Timedelta": """ :return: the elapsed time as a pandas.Timedelta object """ return pd.Timedelta(self.get_elapsed_time_secs(), unit="s")
[docs] def get_elapsed_time_string(self) -> str: """ :return: a string representation of the elapsed time """ secs = self.get_elapsed_time_secs() if secs < 60: return f"{secs:.3f} seconds" else: try: import pandas as pd return str(pd.Timedelta(secs, unit="s")) except ImportError: return format_duration(secs)
[docs]class StopWatchManager: """ A singleton which manages a pool of named stopwatches, such that executions to be timed by referring to a name only - without the need for a limited scope. """ _instance = None
[docs] @classmethod def get_instance(cls): if cls._instance is None: cls._instance = StopWatchManager(42) return cls._instance
def __init__(self, secret): if secret != 42: raise Exception("Use only the singleton instance via getInstance") self._stopWatches = {}
[docs] def start(self, name): self._stopWatches[name] = time.time()
[docs] def stop(self, name) -> float: """ :param name: the name of the stopwatch :return: the time that has passed in seconds """ time_passed_secs = time.time() - self._stopWatches[name] del self._stopWatches[name] return time_passed_secs
[docs] def is_running(self, name): return name in self._stopWatches
[docs]class LogTime: """ An execution time logger which can be conveniently applied using a with-statement - in order to log the executing time of the respective with-block. """ def __init__(self, name, enabled=True, logger: Logger = None): """ :param name: the name of the event whose time is to be logged upon completion as "<name> completed in <time>" :param enabled: whether the logging is actually enabled; can be set to False to disable logging without necessitating changes to client code :param logger: the logger to use; if None, use the logger of LogTime's module """ self.name = name self.enabled = enabled self.stopwatch = None self.logger = logger if logger is not None else log
[docs] def start(self): """ Starts the stopwatch """ self.stopwatch = StopWatch() if self.enabled: self.logger.info(f"{self.name} starting ...")
[docs] def stop(self): """ Stops the stopwatch and logs the time taken (if enabled) """ if self.stopwatch is not None and self.enabled: self.logger.info(f"{self.name} completed in {self.stopwatch.get_elapsed_time_string()}")
def __exit__(self, exc_type, exc_value, traceback): self.stop() def __enter__(self): self.start() return self
[docs]class LoggerContext(Generic[THandler], ABC): """ Base class for context handlers to be used in conjunction with Python's `with` statement. """ def __init__(self, enabled=True): """ :param enabled: whether to actually perform any logging. This switch allows the with statement to be applied regardless of whether logging shall be enabled. """ self.enabled = enabled self._log_handler = None @abstractmethod def _create_log_handler(self) -> THandler: pass def __enter__(self) -> Optional[THandler]: if self.enabled: self._log_handler = self._create_log_handler() return self._log_handler def __exit__(self, exc_type, exc_value, traceback): if self._log_handler is not None: remove_log_handler(self._log_handler)
[docs]class FileLoggerContext(LoggerContext[FileHandler]): """ A context handler to be used in conjunction with Python's `with` statement which enables file-based logging. """ def __init__(self, path: str, append=True, enabled=True): """ :param path: the path to the log file :param append: whether to append in case the file already exists; if False, always create a new file. :param enabled: whether to actually perform any logging. This switch allows the with statement to be applied regardless of whether logging shall be enabled. """ self.path = path self.append = append super().__init__(enabled=enabled) def _create_log_handler(self) -> FileHandler: return add_file_logger(self.path, append=self.append, register_atexit=False)
[docs]class MemoryLoggerContext(LoggerContext[MemoryStreamHandler]): """ A context handler to be used in conjunction with Python's `with` statement which enables in-memory logging. """ def _create_log_handler(self) -> MemoryStreamHandler: return add_memory_logger()
[docs]class LoggingDisabledContext: """ A context manager that will temporarily disable logging """ def __init__(self, highest_level=CRITICAL): """ :param highest_level: the highest level to disable """ self._highest_level = highest_level self._previous_level = None def __enter__(self): self._previous_level = lg.root.manager.disable lg.disable(self._highest_level) def __exit__(self, exc_type, exc_value, traceback): lg.disable(self._previous_level)
# noinspection PyShadowingBuiltins
[docs]class FallbackHandler(Handler): """ A log handler which applies the given handler only if the root logger has no defined handlers (or no handlers other than this fallback handler itself) """ def __init__(self, handler: Handler, level=NOTSET): """ :param handler: the handler to which messages shall be passed on :param level: the minimum level to output; if NOTSET, pass on everything """ super().__init__(level=level) self._handler = handler
[docs] def emit(self, record): root_handlers = getLogger().handlers if len(root_handlers) == 0 or (len(root_handlers) == 1 and root_handlers[0] == self): self._handler.emit(record)