From 0e8e831da788bd14e23bd0c9e87b2395f966aeb2 Mon Sep 17 00:00:00 2001 From: Kevin Michel Date: Thu, 7 Nov 2024 01:39:57 +0100 Subject: [PATCH 1/2] fix: don't send all aiokafka log.error to sentry These log events are numerous and costly. When these `log.error` events are related to real error, they cause exceptions which are still properly handled and recorded by Sentry, no need to also send individual events for all the `log.error` in addition to the exceptions. The same logic was already applied for the `kafka` library. --- src/karapace/sentry/sentry_client.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/karapace/sentry/sentry_client.py b/src/karapace/sentry/sentry_client.py index 776214c7f..c4dc99d33 100644 --- a/src/karapace/sentry/sentry_client.py +++ b/src/karapace/sentry/sentry_client.py @@ -41,6 +41,8 @@ def _initialize_sentry(self) -> None: # Don't send library logged errors to Sentry as there is also proper return value or raised exception to calling code from sentry_sdk.integrations.logging import ignore_logger + ignore_logger("aiokafka") + ignore_logger("aiokafka.*") ignore_logger("kafka") ignore_logger("kafka.*") From 88f7185ff1bd3ea8233c7626fa1167809bf9f7be Mon Sep 17 00:00:00 2001 From: Elia Migliore Date: Mon, 12 Feb 2024 20:46:55 +0100 Subject: [PATCH 2/2] fix: harden the order of keys that needs to be serialized --- src/karapace/key_format.py | 32 ++++++++++++++++++++++------ src/karapace/schema_registry_apis.py | 2 +- 2 files changed, 26 insertions(+), 8 deletions(-) diff --git a/src/karapace/key_format.py b/src/karapace/key_format.py index e39d4c49e..64f0e525a 100644 --- a/src/karapace/key_format.py +++ b/src/karapace/key_format.py @@ -5,16 +5,31 @@ See LICENSE for details """ +from collections import OrderedDict from enum import Enum from karapace.typing import ArgJsonObject from karapace.utils import json_encode -from typing import Optional +from types import MappingProxyType +from typing import Final, Optional -SCHEMA_KEY_ORDER = ["keytype", "subject", "version", "magic"] -CONFIG_KEY_ORDER = ["keytype", "subject", "magic"] -NOOP_KEY_ORDER = ["keytype", "magic"] +# used by the OrderedDict for the relative order of keys. +SCHEMA_KEY_ORDER: Final[tuple[str, str, str, str]] = ("keytype", "subject", "version", "magic") +CONFIG_KEY_ORDER: Final[tuple[str, str, str]] = ("keytype", "subject", "magic") +NOOP_KEY_ORDER: Final[tuple[str, str]] = ("keytype", "magic") -CANONICAL_KEY_ORDERS = [SCHEMA_KEY_ORDER, CONFIG_KEY_ORDER, NOOP_KEY_ORDER] +KEY_ORDER = MappingProxyType( + { + tuple(sorted(SCHEMA_KEY_ORDER)): SCHEMA_KEY_ORDER, + tuple(sorted(CONFIG_KEY_ORDER)): CONFIG_KEY_ORDER, + tuple(sorted(NOOP_KEY_ORDER)): NOOP_KEY_ORDER, + } +) + +CANONICAL_KEY_ORDERS: tuple[tuple[str, str, str, str], tuple[str, str, str], tuple[str, str]] = ( + SCHEMA_KEY_ORDER, + CONFIG_KEY_ORDER, + NOOP_KEY_ORDER, +) class KeyMode(Enum): @@ -72,8 +87,11 @@ def format_key( corrected_key["version"] = key["version"] # Magic is the last element corrected_key["magic"] = key["magic"] - return json_encode(corrected_key, binary=True, sort_keys=False, compact=True) + + fixed_order = KEY_ORDER[tuple(sorted(corrected_key.keys()))] + fixed_order_dict = OrderedDict(list(sorted(corrected_key.items(), key=lambda t: fixed_order.index(t[0])))) + return json_encode(fixed_order_dict, binary=True, sort_keys=False, compact=True) def is_key_in_canonical_format(key: ArgJsonObject) -> bool: - return list(key.keys()) in CANONICAL_KEY_ORDERS + return tuple(key.keys()) in CANONICAL_KEY_ORDERS diff --git a/src/karapace/schema_registry_apis.py b/src/karapace/schema_registry_apis.py index fbb8f5a0c..ef778b008 100644 --- a/src/karapace/schema_registry_apis.py +++ b/src/karapace/schema_registry_apis.py @@ -1307,7 +1307,7 @@ async def _forward_request_remote( if auth_header is not None: headers["Authorization"] = auth_header - with async_timeout.timeout(timeout): + async with async_timeout.timeout(timeout): async with func(url, headers=headers, json=body) as response: if response.headers.get("content-type", "").startswith(JSON_CONTENT_TYPE): resp_content = await response.json()