diff options
author | Martin Fischer <martin@push-f.com> | 2025-03-22 11:47:54 +0100 |
---|---|---|
committer | Martin Fischer <martin@push-f.com> | 2025-03-23 23:36:40 +0100 |
commit | e451a31ed7a0d5fa268a2065906c6fb803e6ae26 (patch) | |
tree | 8dde16820972653c6b67e08b4e2319c43aa18db1 |
initial commitv0.0.1
-rw-r--r-- | .gitignore | 11 | ||||
-rw-r--r-- | LICENSE | 19 | ||||
-rw-r--r-- | README.md | 57 | ||||
-rw-r--r-- | default.nix | 19 | ||||
-rwxr-xr-x | example.py | 26 | ||||
-rw-r--r-- | logformat/__init__.py | 282 | ||||
-rw-r--r-- | logformat/py.typed | 0 | ||||
-rw-r--r-- | pyproject.toml | 25 | ||||
-rwxr-xr-x | test_logformat.py | 222 |
9 files changed, 661 insertions, 0 deletions
diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..64a852a --- /dev/null +++ b/.gitignore @@ -0,0 +1,11 @@ +*.pyc +*.egg-info/ + +# created by `pip install . --config-settings editable_mode=compat` +build/ + +# created by `python3 -m build` +dist/ + +# created by `nix-build` +result @@ -0,0 +1,19 @@ +Copyright (c) 2025 Martin Fischer + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. diff --git a/README.md b/README.md new file mode 100644 index 0000000..78bbda9 --- /dev/null +++ b/README.md @@ -0,0 +1,57 @@ +# logformat - logfmt logging for Python + +* implements the same value escaping as the [logfmt library] used by Grafana Loki +* implements a `logging.Formatter` so it works with any library using the standard library logging +* implements a convenience wrapper around `logging.Logging` for specifying structured fields via `kwargs` + +```python +import logging + +import logformat + +logfmt_handler = logging.StreamHandler() +logfmt_handler.setFormatter(logformat.LogfmtFormatter()) +logging.basicConfig(handlers=[logfmt_handler], level=logging.INFO) + +logger = logformat.get_logger() + +logger.warning("this seems off", some_id=33) +``` + +Will output a line like: + +``` +time=2025-03-23T06:21:36Z level=warning msg="this seems off" some_id=33 +``` + +`exc_info` and `stack_info` are supported via `backtrace=True` and `stack=True` +(which will add same-named fields). + +In the main method of a script you should always catch any exception and log +them as errors, so that unexpected errors show up properly in your log file. +This library makes this easy by providing a `log_uncaught` decorator: + +```python +logger = logformat.get_logger() + +@logger.log_uncaught +def run(): + # your script + ... +``` + +This library intentionally doesn't provide any pretty terminal output but the +produced logs can be viewed with the [logfmt CLI] (since that tool again uses +the [logfmt library] that this library is compatible with). + +## Alternatives + +* structlog's `get_logger` returns `Any`. + While there's a typed alternative that's a bit of a footgun. + +* logfmter doesn't include the time by default, names the time field `when` by default + and the level field `at` by default, doesn't use ISO dates by default + and isn't compatible with the Go [logfmt library] as of March 2025 + +[logfmt library]: https://github.com/go-logfmt/logfmt +[logfmt CLI]: https://github.com/TheEdgeOfRage/logfmt diff --git a/default.nix b/default.nix new file mode 100644 index 0000000..07331d7 --- /dev/null +++ b/default.nix @@ -0,0 +1,19 @@ +{ pkgs ? import <nixpkgs> {} }: +with pkgs.python313Packages; + +buildPythonPackage rec { + pname = "logformat"; + version = "git"; + src = ./.; + pyproject = true; + + build-system = [ + setuptools + ]; + + disabled = pythonOlder "3.13"; + + installCheckPhase = '' + python ${./test_logformat.py} + ''; +} diff --git a/example.py b/example.py new file mode 100755 index 0000000..0892117 --- /dev/null +++ b/example.py @@ -0,0 +1,26 @@ +#!/usr/bin/env python3 +import json +import logging + +import logformat +import requests + + +logfmt_handler = logging.StreamHandler() +logfmt_handler.setFormatter(logformat.LogfmtFormatter()) +logging.basicConfig(handlers=[logfmt_handler], level=logging.DEBUG) + + +logger = logformat.get_logger() + +requests.get('http://example.com') + +logger.debug("what's happening") +logger.info("something's happening") +logger.warning("this seems off", some_id=33) +logger.error("oh no") + +try: + json.loads("maybe") +except: + logger.error("failed to decode", traceback=True) diff --git a/logformat/__init__.py b/logformat/__init__.py new file mode 100644 index 0000000..4af5c46 --- /dev/null +++ b/logformat/__init__.py @@ -0,0 +1,282 @@ +import asyncio +import base64 +import datetime +import functools +import json +import logging +import time +from typing import Callable, Never, cast + + +class LogfmtFormatter(logging.Formatter): + converter = time.gmtime + + def __init__(self, process_id=False, process_name=False, thread_id=False, thread_name=False): + """Initializes a logfmt formatter.""" + self._process_id = process_id + self._process_name = process_name + self._thread_id = thread_id + self._thread_name = thread_name + + def format(self, record): + fields: dict = { + "time": self.formatTime(record, "%Y-%m-%dT%H:%M:%SZ"), + "level": record.levelname.lower(), + } + + if record.name != "root": + # omitting logger=root for readability + fields['logger'] = record.name + + fields['msg'] = record.getMessage() + + for k, v in record.__dict__.items(): + # using getattr because of https://github.com/python/typeshed/issues/12136 + if k in getattr(logging.LogRecord, "__static_attributes__"): + continue + if k in ('time', 'msg'): + continue + + # This mirrors the logic of https://github.com/go-logfmt/logfmt/blob/main/encode.go. + k = ''.join(c for c in k if c > ' ' and c not in '="') + if k == '': + continue + + fields[k] = v + + if self._process_id: + fields['process_id'] = record.process + if self._process_name: + fields['process_name'] = record.processName + if self._thread_id: + fields['thread_id'] = record.thread + if self._thread_name: + fields['thread_name'] = record.threadName + if record.taskName: + fields['task'] = record.taskName + if record.exc_info: + fields['traceback'] = self.formatException(record.exc_info) + if record.stack_info: + fields['stack'] = self.formatStack(record.stack_info) + + return ' '.join(f'{k}={_fmt_value(v)}' for k, v in fields.items()) + + +def get_logger(name: str | None = None): + return _Logger(logging.getLogger(name)) + + +def _fmt_value(obj): + if obj is None: + value = "null" + elif isinstance(obj, bool): + value = str(obj).lower() + elif isinstance(obj, bytes): + value = base64.b64encode(obj).decode() + elif isinstance(obj, datetime.datetime): + value = obj.isoformat().replace('+00:00', 'Z') + else: + value = str(obj) + + # This mirrors the logic of https://github.com/go-logfmt/logfmt/blob/main/encode.go. + if any(c <= ' ' or c in '="' for c in value): + return json.dumps(value, ensure_ascii=False) + else: + return value + + +_never: Never = cast(Never, None) + + +class _Logger: + def __init__(self, logger: logging.Logger): + self._logger = logger + + def debug( + self, + msg: str, + traceback=False, + stack=False, + time=_never, + level=_never, + process_id=_never, + process_name=_never, + thread_id=_never, + thread_name=_never, + task=_never, + # Logger.makeRecord raises if any of logging.LogRecord.__static_attributes__ are in extra. + args=_never, + created=_never, + exc_info=_never, + exc_text=_never, + filename=_never, + funcName=_never, + levelname=_never, + levelno=_never, + module=_never, + msecs=_never, + name=_never, + pathname=_never, + process=_never, + processName=_never, + relativeCreated=_never, + stack_info=_never, + taskName=_never, + thread=_never, + threadName=_never, + **kwargs, + ): + self._logger.debug(msg, exc_info=traceback, stack_info=stack, extra=kwargs) + + def info( + self, + msg: str, + traceback=False, + stack=False, + time=_never, + level=_never, + process_id=_never, + process_name=_never, + thread_id=_never, + thread_name=_never, + task=_never, + # Logger.makeRecord raises if any of logging.LogRecord.__static_attributes__ are in extra. + args=_never, + created=_never, + exc_info=_never, + exc_text=_never, + filename=_never, + funcName=_never, + levelname=_never, + levelno=_never, + module=_never, + msecs=_never, + name=_never, + pathname=_never, + process=_never, + processName=_never, + relativeCreated=_never, + stack_info=_never, + taskName=_never, + thread=_never, + threadName=_never, + **kwargs, + ): + self._logger.info(msg, exc_info=traceback, stack_info=stack, extra=kwargs) + + def warning( + self, + msg: str, + traceback=False, + stack=False, + time=_never, + level=_never, + process_id=_never, + process_name=_never, + thread_id=_never, + thread_name=_never, + task=_never, + # Logger.makeRecord raises if any of logging.LogRecord.__static_attributes__ are in extra. + args=_never, + created=_never, + exc_info=_never, + exc_text=_never, + filename=_never, + funcName=_never, + levelname=_never, + levelno=_never, + module=_never, + msecs=_never, + name=_never, + pathname=_never, + process=_never, + processName=_never, + relativeCreated=_never, + stack_info=_never, + taskName=_never, + thread=_never, + threadName=_never, + **kwargs, + ): + self._logger.warning(msg, exc_info=traceback, stack_info=stack, extra=kwargs) + + def error( + self, + msg: str, + traceback=False, + stack=False, + time=_never, + level=_never, + process_id=_never, + process_name=_never, + thread_id=_never, + thread_name=_never, + task=_never, + # Logger.makeRecord raises if any of logging.LogRecord.__static_attributes__ are in extra. + args=_never, + created=_never, + exc_info=_never, + exc_text=_never, + filename=_never, + funcName=_never, + levelname=_never, + levelno=_never, + module=_never, + msecs=_never, + name=_never, + pathname=_never, + process=_never, + processName=_never, + relativeCreated=_never, + stack_info=_never, + taskName=_never, + thread=_never, + threadName=_never, + **kwargs, + ): + self._logger.error(msg, exc_info=traceback, stack_info=stack, extra=kwargs) + + # intentionally omitting critical ... just use errors + + def log_uncaught(self, f: Callable): + """ + Wraps the given function to log an uncaught exception as an error with a traceback and raise SystemExit(1). + + Meant to be used as a decorator on the main function. + """ + + @functools.wraps(f) + def sync_wrapper(*args, **kwargs): + try: + return f(*args, **kwargs) + except Exception as exc: + exc_str = self._stringify_exception(exc) + self.error(f"unexpected exception: {exc_str}", traceback=True) + raise SystemExit(1) + + @functools.wraps(f) + async def async_wrapper(*args, **kwargs): + try: + return await f(*args, **kwargs) + except Exception as exc: + exc_str = self._stringify_exception(exc) + self.error(f"unexpected exception: {exc_str}", traceback=True) + raise SystemExit(1) + + if asyncio.iscoroutinefunction(f): + return async_wrapper + else: + return sync_wrapper + + def _stringify_exception(self, exc: Exception): + try: + return str(exc) + except Exception: + self.warning("while logging unexpected exception str(exc) raised", traceback=True) + + try: + return repr(exc) + except Exception: + self.warning("while logging unexpected exception repr(exc) raised", traceback=True) + + return '??? (str and repr failed)' diff --git a/logformat/py.typed b/logformat/py.typed new file mode 100644 index 0000000..e69de29 --- /dev/null +++ b/logformat/py.typed diff --git a/pyproject.toml b/pyproject.toml new file mode 100644 index 0000000..7640b73 --- /dev/null +++ b/pyproject.toml @@ -0,0 +1,25 @@ +[project] +name = "logformat" +version = "0.0.1" +authors = [ + { name="Martin Fischer", email="martin@push-f.com" }, +] +description = "logfmt logging for Python" +requires-python = ">=3.13" # because of __static_attributes__ + +readme = "README.md" +classifiers = [ + "Programming Language :: Python :: 3", + "Operating System :: OS Independent", +] +license = "MIT" +license-files = ["LICENSE"] + +[project.urls] +repository = "https://git.push-f.com/logformat" + +[tool.setuptools] +packages = ["logformat"] + +[tool.black] +line-length = 100 diff --git a/test_logformat.py b/test_logformat.py new file mode 100755 index 0000000..cbcc14d --- /dev/null +++ b/test_logformat.py @@ -0,0 +1,222 @@ +#!/usr/bin/env python3 +import asyncio +import contextlib +import datetime +import functools +import io +import logging +import textwrap +import unittest +import unittest.mock + +import logformat + + +def set_up(level=logging.DEBUG): + stream = io.StringIO() + logfmt_handler = logging.StreamHandler(stream) + logfmt_handler.setFormatter(logformat.LogfmtFormatter()) + logging.basicConfig(handlers=[logfmt_handler], level=level, force=True) + return stream + + +# We're not using pytest here because pytest messes with the logging config, +# setting it's own handlers, apparently even when disabling the pytest logging +# plugin with `-p no:logging`. +test_suite = unittest.TestSuite() + + +def test(test): + @functools.wraps(test) + def wrapped_test(): + t = unittest.TestCase() + with unittest.mock.patch("time.time_ns", return_value=1742634901036965331): + test(t) + + test_suite.addTest(unittest.FunctionTestCase(wrapped_test)) + + +@test +def test_logformat(t: unittest.TestCase): + stream = set_up() + logger = logformat.get_logger() + logger.debug("what's happening") + logger.info("something's happening") + logger.warning("this seems off") + logger.error("oh no") + t.assertEqual( + stream.getvalue(), + textwrap.dedent( + ''' + time=2025-03-22T09:15:01Z level=debug msg="what's happening" + time=2025-03-22T09:15:01Z level=info msg="something's happening" + time=2025-03-22T09:15:01Z level=warning msg="this seems off" + time=2025-03-22T09:15:01Z level=error msg="oh no" + ''' + ).lstrip(), + ) + + +@test +def test_escaping(t: unittest.TestCase): + stream = set_up() + logger = logformat.get_logger() + logger.warning(" \t\n\x00='\"‽") + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=warning msg=" \\t\\n\\u0000=\'\\"‽"\n', + ) + + +@test +def test_fmtlogger_extra_uses_str(t: unittest.TestCase): + class Foo: + def __str__(self): + return "hello!" + + stream = set_up() + logger = logformat.get_logger() + logger.warning("test", value=Foo()) + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=warning msg=test value=hello!\n', + ) + + +@test +def test_fmtlogger_extra_none(t: unittest.TestCase): + stream = set_up() + logger = logformat.get_logger() + logger.warning("test", helpful_info=None) + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=warning msg=test helpful_info=null\n', + ) + + +@test +def test_fmtlogger_extra_bool(t: unittest.TestCase): + stream = set_up() + logger = logformat.get_logger() + logger.warning("test", off_by_one=True) + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=warning msg=test off_by_one=true\n', + ) + + +@test +def test_fmtlogger_extra_datetime(t: unittest.TestCase): + stream = set_up() + logger = logformat.get_logger() + logger.warning( + "test", + expiry=datetime.datetime(2025, 3, 22, 15, 30, 00, 00, tzinfo=datetime.UTC), + ) + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=warning msg=test expiry=2025-03-22T15:30:00Z\n', + ) + + +@test +def test_stdlib_logger(t: unittest.TestCase): + stream = set_up() + logger = logging.getLogger() + logger.debug("what's happening %s", 1234) + logger.info("something's happening") + logger.warning("this seems off") + logger.error("oh no") + logger.critical("aaaaaaaaah!") + t.assertEqual( + stream.getvalue(), + textwrap.dedent( + ''' + time=2025-03-22T09:15:01Z level=debug msg="what's happening 1234" + time=2025-03-22T09:15:01Z level=info msg="something's happening" + time=2025-03-22T09:15:01Z level=warning msg="this seems off" + time=2025-03-22T09:15:01Z level=error msg="oh no" + time=2025-03-22T09:15:01Z level=critical msg=aaaaaaaaah! + ''' + ).lstrip(), + ) + + +@test +def test_log_uncaught_sync_returns(t: unittest.TestCase): + stream = set_up() + + logger = logformat.get_logger() + + @logger.log_uncaught + def run(): + return 42 + + t.assertEqual(run(), 42) + t.assertEqual(stream.getvalue(), "") + + +@test +def test_log_uncaught_sync_raises(t: unittest.TestCase): + stream = set_up() + + logger = logformat.get_logger() + + @logger.log_uncaught + def run(): + 5 / 0 + + with t.assertRaises(SystemExit), stub_traceback(): + run() + + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=error msg="unexpected exception: division by zero" traceback="stub traceback"\n', + ) + + +@test +def test_log_uncaught_async_returns(t: unittest.TestCase): + stream = set_up(level=logging.INFO) + + logger = logformat.get_logger() + + @logger.log_uncaught + async def run(): + return 42 + + t.assertEqual(asyncio.run(run()), 42) + t.assertEqual(stream.getvalue(), "") + + +@test +def test_log_uncaught_async_raises(t: unittest.TestCase): + stream = set_up(level=logging.INFO) + + logger = logformat.get_logger() + + @logger.log_uncaught + async def run(): + 5 / 0 + + with t.assertRaises(SystemExit), stub_traceback(): + asyncio.run(run()) + + t.assertEqual( + stream.getvalue(), + 'time=2025-03-22T09:15:01Z level=error msg="unexpected exception: division by zero" task=Task-4 traceback="stub traceback"\n', + ) + + +@contextlib.contextmanager +def stub_traceback(): + def stub_print_exception(*args, **kwargs): + kwargs['file'].write('stub traceback') + + with unittest.mock.patch("traceback.print_exception", stub_print_exception): + yield + + +if __name__ == "__main__": + runner = unittest.TextTestRunner() + runner.run(test_suite) |