|
| 1 | +import base64 |
| 2 | +import logging |
| 3 | +from binascii import Error as BinAsciiError |
| 4 | +from datetime import datetime |
| 5 | +from typing import Dict, List, Optional, Type, Union |
| 6 | + |
| 7 | +from pydantic import BaseModel, validator |
| 8 | + |
| 9 | +from aws_lambda_powertools.utilities.parser.types import Literal |
| 10 | + |
# Separator used to split the event's ``bootstrapServers`` string into a list.
SERVERS_DELIMITER = ","

# Module-level logger named after this module.
logger = logging.getLogger(__name__)
| 14 | + |
| 15 | + |
def _base64_decode(value: str) -> bytes:
    """Decode a base64-encoded Kafka record item.

    Parameters
    ----------
    value : str
        Base64-encoded payload.

    Returns
    -------
    bytes
        The decoded raw bytes.

    Raises
    ------
    ValueError
        If ``value`` cannot be base64-decoded. The underlying error is kept
        as ``__cause__`` so the root problem stays visible in tracebacks.
    """
    logger.debug("Decoding base64 Kafka record item before parsing")
    try:
        return base64.b64decode(value)
    except (BinAsciiError, TypeError) as exc:
        raise ValueError("base64 decode failed") from exc
| 22 | + |
| 23 | + |
| 24 | +def _bytes_to_string(value: bytes) -> str: |
| 25 | + try: |
| 26 | + return value.decode("utf-8") |
| 27 | + except (BinAsciiError, TypeError): |
| 28 | + raise ValueError("base64 UTF-8 decode failed") |
| 29 | + |
| 30 | + |
class KafkaRecordModel(BaseModel):
    """A single record of a Kafka event.

    During validation ``key`` is base64-decoded to bytes, ``value`` is
    base64-decoded and then decoded as UTF-8 text, and every header value is
    converted to ``bytes``.
    """

    topic: str
    partition: int
    offset: int
    timestamp: datetime
    timestampType: str
    key: bytes
    value: Union[str, Type[BaseModel]]
    headers: List[Dict[str, bytes]]

    # validators
    # Registered without ``pre=True``, unlike the two validators below.
    _decode_key = validator("key", allow_reuse=True)(_base64_decode)

    @validator("value", pre=True, allow_reuse=True)
    def data_base64_decode(cls, value):
        """Base64-decode the raw ``value`` and return it as a UTF-8 string."""
        as_bytes = _base64_decode(value)
        return _bytes_to_string(as_bytes)

    @validator("headers", pre=True, allow_reuse=True)
    def decode_headers_list(cls, value):
        """Return the headers with every value converted to ``bytes``.

        New list and dict objects are built instead of assigning into the
        incoming ones, so the raw event handed in by the caller is left
        unmodified by parsing.
        """
        # NOTE(review): presumably each header value is a list of byte
        # values (ints) -- confirm against the event payload.
        return [{name: bytes(raw) for name, raw in header.items()} for header in value]
| 55 | + |
| 56 | + |
class KafkaEventModel(BaseModel):
    """Event model for the self-managed Apache Kafka Lambda trigger.

    Documentation:
    --------------
    - https://docs.aws.amazon.com/lambda/latest/dg/with-kafka.html
    """

    eventSource: Literal["aws:SelfManagedKafka"]
    bootstrapServers: Optional[List[str]]
    records: Dict[str, List[KafkaRecordModel]]

    @validator("bootstrapServers", pre=True, allow_reuse=True)
    def split_servers(cls, value):
        """Split the raw servers string on ``SERVERS_DELIMITER``.

        A falsy input (missing, ``None`` or empty) yields ``None``.
        """
        if not value:
            return None
        return value.split(SERVERS_DELIMITER)
0 commit comments