cledar-sdk 2.0.1__py3-none-any.whl → 2.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (85) hide show
  1. cledar/__init__.py +0 -0
  2. cledar/kafka/README.md +239 -0
  3. cledar/kafka/__init__.py +40 -0
  4. cledar/kafka/clients/base.py +98 -0
  5. cledar/kafka/clients/consumer.py +110 -0
  6. cledar/kafka/clients/producer.py +80 -0
  7. cledar/kafka/config/schemas.py +178 -0
  8. cledar/kafka/exceptions.py +22 -0
  9. cledar/kafka/handlers/dead_letter.py +82 -0
  10. cledar/kafka/handlers/parser.py +49 -0
  11. cledar/kafka/logger.py +3 -0
  12. cledar/kafka/models/input.py +13 -0
  13. cledar/kafka/models/message.py +10 -0
  14. cledar/kafka/models/output.py +8 -0
  15. cledar/kafka/tests/.env.test.kafka +3 -0
  16. cledar/kafka/tests/README.md +216 -0
  17. cledar/kafka/tests/conftest.py +104 -0
  18. cledar/kafka/tests/integration/__init__.py +1 -0
  19. cledar/kafka/tests/integration/conftest.py +78 -0
  20. cledar/kafka/tests/integration/helpers.py +47 -0
  21. cledar/kafka/tests/integration/test_consumer_integration.py +375 -0
  22. cledar/kafka/tests/integration/test_integration.py +394 -0
  23. cledar/kafka/tests/integration/test_producer_consumer_interaction.py +388 -0
  24. cledar/kafka/tests/integration/test_producer_integration.py +217 -0
  25. cledar/kafka/tests/unit/__init__.py +1 -0
  26. cledar/kafka/tests/unit/test_base_kafka_client.py +391 -0
  27. cledar/kafka/tests/unit/test_config_validation.py +609 -0
  28. cledar/kafka/tests/unit/test_dead_letter_handler.py +443 -0
  29. cledar/kafka/tests/unit/test_error_handling.py +674 -0
  30. cledar/kafka/tests/unit/test_input_parser.py +310 -0
  31. cledar/kafka/tests/unit/test_input_parser_comprehensive.py +489 -0
  32. cledar/kafka/tests/unit/test_utils.py +25 -0
  33. cledar/kafka/tests/unit/test_utils_comprehensive.py +408 -0
  34. cledar/kafka/utils/callbacks.py +19 -0
  35. cledar/kafka/utils/messages.py +28 -0
  36. cledar/kafka/utils/topics.py +2 -0
  37. cledar/kserve/README.md +352 -0
  38. cledar/kserve/__init__.py +3 -0
  39. cledar/kserve/tests/__init__.py +0 -0
  40. cledar/kserve/tests/test_utils.py +64 -0
  41. cledar/kserve/utils.py +27 -0
  42. cledar/logging/README.md +53 -0
  43. cledar/logging/__init__.py +3 -0
  44. cledar/logging/tests/test_universal_plaintext_formatter.py +249 -0
  45. cledar/logging/universal_plaintext_formatter.py +94 -0
  46. cledar/monitoring/README.md +71 -0
  47. cledar/monitoring/__init__.py +3 -0
  48. cledar/monitoring/monitoring_server.py +112 -0
  49. cledar/monitoring/tests/integration/test_monitoring_server_int.py +162 -0
  50. cledar/monitoring/tests/test_monitoring_server.py +59 -0
  51. cledar/nonce/README.md +99 -0
  52. cledar/nonce/__init__.py +3 -0
  53. cledar/nonce/nonce_service.py +36 -0
  54. cledar/nonce/tests/__init__.py +0 -0
  55. cledar/nonce/tests/test_nonce_service.py +136 -0
  56. cledar/redis/README.md +536 -0
  57. cledar/redis/__init__.py +15 -0
  58. cledar/redis/async_example.py +111 -0
  59. cledar/redis/example.py +37 -0
  60. cledar/redis/exceptions.py +22 -0
  61. cledar/redis/logger.py +3 -0
  62. cledar/redis/model.py +10 -0
  63. cledar/redis/redis.py +525 -0
  64. cledar/redis/redis_config_store.py +252 -0
  65. cledar/redis/tests/test_async_integration_redis.py +158 -0
  66. cledar/redis/tests/test_async_redis_service.py +380 -0
  67. cledar/redis/tests/test_integration_redis.py +119 -0
  68. cledar/redis/tests/test_redis_service.py +319 -0
  69. cledar/storage/README.md +529 -0
  70. cledar/storage/__init__.py +4 -0
  71. cledar/storage/constants.py +3 -0
  72. cledar/storage/exceptions.py +50 -0
  73. cledar/storage/models.py +19 -0
  74. cledar/storage/object_storage.py +955 -0
  75. cledar/storage/tests/conftest.py +18 -0
  76. cledar/storage/tests/test_abfs.py +164 -0
  77. cledar/storage/tests/test_integration_filesystem.py +359 -0
  78. cledar/storage/tests/test_integration_s3.py +453 -0
  79. cledar/storage/tests/test_local.py +384 -0
  80. cledar/storage/tests/test_s3.py +521 -0
  81. {cledar_sdk-2.0.1.dist-info → cledar_sdk-2.0.3.dist-info}/METADATA +1 -1
  82. cledar_sdk-2.0.3.dist-info/RECORD +84 -0
  83. cledar_sdk-2.0.1.dist-info/RECORD +0 -4
  84. {cledar_sdk-2.0.1.dist-info → cledar_sdk-2.0.3.dist-info}/WHEEL +0 -0
  85. {cledar_sdk-2.0.1.dist-info → cledar_sdk-2.0.3.dist-info}/licenses/LICENSE +0 -0
@@ -0,0 +1,352 @@
1
+ # KServe Service
2
+
3
+ ## Purpose
4
+
5
+ The `cledar.kserve` package provides utilities for working with KServe inference services, particularly for handling CloudEvents headers that are used in KServe's event-driven architecture. It simplifies the extraction and parsing of metadata from CloudEvents headers, making it easier to integrate with KServe deployments.
6
+
7
+ ### Key Features
8
+
9
+ - **CloudEvents Parsing**: Extract Kafka topic names from CloudEvents source headers
10
+ - **Header Validation**: Robust validation of CloudEvents header format
11
+ - **Type Safety**: Fully typed with Python type hints
12
+ - **Well Tested**: Comprehensive unit tests covering edge cases
13
+ - **Lightweight**: Minimal dependencies, focused utility functions
14
+
15
+ ### Use Cases
16
+
17
+ - Parsing CloudEvents headers in KServe inference services
18
+ - Extracting Kafka topic information from event-driven requests
19
+ - Building event-driven ML inference pipelines
20
+ - Integration with KServe and Knative Eventing
21
+
22
+ ## Installation
23
+
24
+ This package is part of the `cledar-python-sdk`. Install it using:
25
+
26
+ ```bash
27
+ # Install with uv (recommended)
28
+ uv sync --all-groups
29
+
30
+ # Or with pip
31
+ pip install -e .
32
+ ```
33
+
34
+ ## Usage Example
35
+
36
+ ```python
37
+ from cledar.kserve import get_input_topic
38
+
39
+ # Example CloudEvents headers from KServe request
40
+ headers = {
41
+ "ce-source": "kafka://my-cluster#input-topic",
42
+ "ce-type": "dev.knative.kafka.event",
43
+ "ce-id": "partition:0/offset:123",
44
+ }
45
+
46
+ # Extract the Kafka topic name
47
+ topic = get_input_topic(headers)
48
+ print(topic) # Output: "input-topic"
49
+
50
+ # Handle missing or invalid headers
51
+ empty_headers = {}
52
+ topic = get_input_topic(empty_headers)
53
+ print(topic) # Output: None
54
+
55
+ # Handle headers without delimiter
56
+ invalid_headers = {"ce-source": "kafka://my-cluster/topic"}
57
+ topic = get_input_topic(invalid_headers)
58
+ print(topic) # Output: None
59
+ ```
60
+
61
+ ## Development
62
+
63
+ ### Project Structure
64
+
65
+ ```
66
+ cledar/kserve/
67
+ ├── __init__.py # Package initialization with exports
68
+ ├── utils.py # Utility functions for CloudEvents
69
+ ├── tests/
70
+ │ ├── __init__.py # Test package initialization
71
+ │ └── test_utils.py # Unit tests for utilities
72
+ └── README.md # This file
73
+ ```
74
+
75
+ ## Running Linters
76
+
77
+ The project is configured for multiple linters (see `pyproject.toml` for configuration).
78
+
79
+ ### Available Linter Configurations
80
+
81
+ The project includes configurations for:
82
+ - **Pylint**: Python code analysis (`.tool.pylint` in `pyproject.toml`)
83
+ - **Mypy**: Static type checking (`.tool.mypy` in `pyproject.toml`)
84
+ - **Black**: Code formatting (`.tool.black` in `pyproject.toml`)
85
+
86
+ ### Installing Linters
87
+
88
+ Linters are not included in the dev dependencies by default. Install them separately:
89
+
90
+ ```bash
91
+ # Install all linters
92
+ pip install pylint mypy black
93
+
94
+ # Or with uv
95
+ uv pip install pylint mypy black
96
+ ```
97
+
98
+ ### Running Linters
99
+
100
+ Once installed, run them from the SDK root directory:
101
+
102
+ ```bash
103
+ # From the SDK root directory
104
+ cd /path/to/cledar-python-sdk
105
+
106
+ # Run pylint on cledar.kserve
107
+ pylint cledar/kserve/
108
+
109
+ # Run mypy type checking (strict mode configured)
110
+ mypy cledar/kserve/
111
+
112
+ # Check code formatting with black
113
+ black --check cledar/kserve/
114
+
115
+ # Auto-format code
116
+ black cledar/kserve/
117
+ ```
118
+
119
+ ### Run All Linters
120
+
121
+ ```bash
122
+ # Run all linters in sequence
123
+ pylint cledar/kserve/ && \
124
+ mypy cledar/kserve/ && \
125
+ black --check cledar/kserve/
126
+ ```
127
+
128
+ ### IDE Integration
129
+
130
+ Most IDEs support these linters natively:
131
+ - **VSCode**: Install Python extension, linters auto-detected via `pyproject.toml`
132
+ - **PyCharm**: Enable in Settings → Tools → Python Integrated Tools
133
+ - **Cursor**: Same as VSCode
134
+
135
+ ## Running Unit Tests
136
+
137
+ Unit tests verify the functionality of the CloudEvents parsing utilities.
138
+
139
+ ### Run All Unit Tests
140
+
141
+ ```bash
142
+ # From the SDK root directory
143
+ cd /path/to/cledar-python-sdk
144
+
145
+ # Run all tests using uv
146
+ PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/ -v
147
+ ```
148
+
149
+ ### Run Specific Test File
150
+
151
+ ```bash
152
+ # Run specific test file
153
+ PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/test_utils.py -v
154
+ ```
155
+
156
+ ### Run Specific Test
157
+
158
+ ```bash
159
+ # Run a specific test by name
160
+ PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/test_utils.py::test_get_input_topic_valid_source -v
161
+ ```
162
+
163
+ ### Run with Coverage
164
+
165
+ ```bash
166
+ # Generate coverage report
167
+ PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/ \
168
+ --cov=cledar.kserve \
169
+ --cov-report=html \
170
+ --cov-report=term
171
+
172
+ # View HTML report
173
+ open htmlcov/index.html
174
+ ```
175
+
176
+ ### Unit Test Details
177
+
178
+ - **Test Framework**: pytest
179
+ - **Test Count**: 9 unit tests
180
+ - **Execution Time**: ~0.04 seconds (fast, no external dependencies)
181
+
182
+ #### What Unit Tests Cover:
183
+
184
+ - ✅ Valid CloudEvents source parsing
185
+ - ✅ Whitespace trimming and normalization
186
+ - ✅ Missing header handling
187
+ - ✅ Invalid format detection (no delimiter)
188
+ - ✅ Empty topic after delimiter
189
+ - ✅ Whitespace-only topics
190
+ - ✅ Multiple delimiters in source
191
+ - ✅ Empty source values
192
+ - ✅ Complex topic names with namespaces
193
+
194
+ ## CI/CD Integration
195
+
196
+ ### GitLab CI Example
197
+
198
+ ```yaml
199
+ test-kserve-service:
200
+ stage: test
201
+ image: python:3.12
202
+ script:
203
+ - pip install uv
204
+ - uv sync --all-groups
205
+ - PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/ -v
206
+ ```
207
+
208
+ ### GitHub Actions Example
209
+
210
+ ```yaml
211
+ name: KServe Service Tests
212
+ on: [push, pull_request]
213
+
214
+ jobs:
215
+ unit-tests:
216
+ runs-on: ubuntu-latest
217
+ steps:
218
+ - uses: actions/checkout@v3
219
+ - uses: actions/setup-python@v4
220
+ with:
221
+ python-version: '3.12'
222
+ - name: Install dependencies
223
+ run: |
224
+ pip install uv
225
+ uv sync --all-groups
226
+ - name: Run unit tests
227
+ run: PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/ -v
228
+ ```
229
+
230
+ ## API Reference
231
+
232
+ ### Constants
233
+
234
+ #### `CE_SOURCE_HEADER`
235
+
236
+ The CloudEvents source header key used in KServe requests.
237
+
238
+ ```python
239
+ CE_SOURCE_HEADER = "ce-source"
240
+ ```
241
+
242
+ ### Functions
243
+
244
+ #### `get_input_topic(headers: dict[str, str]) -> str | None`
245
+
246
+ Extract the Kafka topic name from CloudEvents source header.
247
+
248
+ Parses the 'ce-source' header value which is expected to be in the format `prefix#topic_name` and returns the topic name after the '#' delimiter.
249
+
250
+ **Parameters:**
251
+ - `headers` (dict[str, str]): Dictionary of HTTP headers containing CloudEvents metadata.
252
+
253
+ **Returns:**
254
+ - `str | None`: The extracted topic name if the header exists, contains '#', and has a non-empty topic name after the delimiter. Returns `None` otherwise.
255
+
256
+ **Example:**
257
+
258
+ ```python
259
+ >>> headers = {"ce-source": "kafka://cluster#my-topic"}
260
+ >>> get_input_topic(headers)
261
+ 'my-topic'
262
+
263
+ >>> headers = {"ce-source": "kafka://cluster#"}
264
+ >>> get_input_topic(headers)
265
+ None
266
+
267
+ >>> headers = {}
268
+ >>> get_input_topic(headers)
269
+ None
270
+ ```
271
+
272
+ **Edge Cases Handled:**
273
+ - Missing `ce-source` header → Returns `None`
274
+ - No `#` delimiter in source → Returns `None`
275
+ - Empty topic after `#` → Returns `None`
276
+ - Whitespace-only topic → Returns `None` (after stripping)
277
+ - Leading/trailing whitespace → Stripped automatically
278
+ - Multiple `#` delimiters → Only first `#` is used as delimiter
279
+
280
+ ## CloudEvents Format
281
+
282
+ The `ce-source` header in KServe follows the CloudEvents specification and typically has this format:
283
+
284
+ ```
285
+ <protocol>://<cluster-or-namespace>#<topic-name>
286
+ ```
287
+
288
+ **Examples:**
289
+ - `kafka://prod-cluster#user-events`
290
+ - `kafka://namespace.kafka#model-predictions`
291
+ - `kafka://local#ml-inference-requests`
292
+
293
+ The `get_input_topic` function extracts the `<topic-name>` portion after the `#` delimiter.
294
+
295
+ ## Integration with KServe
296
+
297
+ ### Example KServe Predictor
298
+
299
+ ```python
300
+ from kserve import Model, ModelServer
301
+ from cledar.kserve import get_input_topic
302
+ import logging
303
+
304
+ logger = logging.getLogger(__name__)
305
+
306
+ class MyPredictor(Model):
307
+ def __init__(self, name: str):
308
+ super().__init__(name)
309
+
310
+ def predict(self, request: dict, headers: dict[str, str]) -> dict:
311
+ # Extract source topic from CloudEvents headers
312
+ source_topic = get_input_topic(headers)
313
+
314
+ if source_topic:
315
+ logger.info(f"Processing request from topic: {source_topic}")
316
+ else:
317
+ logger.warning("Could not determine source topic from headers")
318
+
319
+ # Your inference logic here
320
+ predictions = self.model.predict(request["instances"])
321
+
322
+ return {"predictions": predictions}
323
+
324
+ if __name__ == "__main__":
325
+ model = MyPredictor("my-model")
326
+ ModelServer().start([model])
327
+ ```
328
+
329
+ ## Running Pre-commit Checks
330
+
331
+ ```bash
332
+ # Format code
333
+ uv run black cledar/kserve/
334
+
335
+ # Check types
336
+ uv run mypy cledar/kserve/
337
+
338
+ # Run linter
339
+ uv run pylint cledar/kserve/
340
+
341
+ # Run all tests
342
+ PYTHONPATH=$PWD uv run pytest cledar/kserve/tests/ -v
343
+ ```
344
+
345
+ ## License
346
+
347
+ See the main repository LICENSE file.
348
+
349
+ ## Support
350
+
351
+ For issues, questions, or contributions, please refer to the main repository's contribution guidelines.
352
+
@@ -0,0 +1,3 @@
1
+ from .utils import get_input_topic
2
+
3
+ __all__ = ["get_input_topic"]
File without changes
@@ -0,0 +1,64 @@
1
from cledar.kserve.utils import get_input_topic


# Unit tests for get_input_topic: CloudEvents 'ce-source' parsing.
# Each test asserts directly on the call result for a single scenario.


def test_get_input_topic_valid_source() -> None:
    """A well-formed source yields the text after the '#' delimiter."""
    assert get_input_topic({"ce-source": "kafka://cluster#my-topic"}) == "my-topic"


def test_get_input_topic_with_whitespace() -> None:
    """Leading/trailing whitespace around the topic is stripped."""
    assert get_input_topic({"ce-source": "kafka://cluster# my-topic "}) == "my-topic"


def test_get_input_topic_missing_header() -> None:
    """An absent 'ce-source' header yields None."""
    no_headers: dict[str, str] = {}
    assert get_input_topic(no_headers) is None


def test_get_input_topic_no_delimiter() -> None:
    """A source without a '#' delimiter yields None."""
    assert get_input_topic({"ce-source": "kafka://cluster/my-topic"}) is None


def test_get_input_topic_empty_after_delimiter() -> None:
    """A '#' with nothing after it yields None."""
    assert get_input_topic({"ce-source": "kafka://cluster#"}) is None


def test_get_input_topic_only_whitespace_after_delimiter() -> None:
    """A '#' followed only by whitespace yields None."""
    assert get_input_topic({"ce-source": "kafka://cluster# "}) is None


def test_get_input_topic_multiple_delimiters() -> None:
    """Only the first '#' splits; later '#' chars stay in the topic."""
    assert (
        get_input_topic({"ce-source": "kafka://cluster#my-topic#with-hash"})
        == "my-topic#with-hash"
    )


def test_get_input_topic_empty_source_value() -> None:
    """An empty source string yields None."""
    assert get_input_topic({"ce-source": ""}) is None


def test_get_input_topic_complex_topic_name() -> None:
    """Dotted/namespaced topic names are returned verbatim."""
    assert (
        get_input_topic(
            {"ce-source": "kafka://prod.cluster.example.com#namespace.my-topic-v2"}
        )
        == "namespace.my-topic-v2"
    )
cledar/kserve/utils.py ADDED
@@ -0,0 +1,27 @@
1
+ CE_SOURCE_HEADER = "ce-source"
2
+
3
+
4
+ def get_input_topic(headers: dict[str, str]) -> str | None:
5
+ """Extract the Kafka topic name from CloudEvents source header.
6
+
7
+ Parses the 'ce-source' header value which is expected to be in the format
8
+ 'prefix#topic_name' and returns the topic name after the '#' delimiter.
9
+
10
+ Args:
11
+ headers: Dictionary of HTTP headers containing CloudEvents metadata.
12
+
13
+ Returns:
14
+ The extracted topic name if the header exists, contains '#', and has
15
+ a non-empty topic name after the delimiter. Returns None otherwise.
16
+
17
+ Example:
18
+ >>> headers = {"ce-source": "kafka://cluster#my-topic"}
19
+ >>> get_input_topic(headers)
20
+ 'my-topic'
21
+ """
22
+ source = headers.get(CE_SOURCE_HEADER)
23
+ if not source or "#" not in source:
24
+ return None
25
+
26
+ topic = source.split("#", 1)[1].strip()
27
+ return topic if topic else None
@@ -0,0 +1,53 @@
1
+ # Universal Formatter
2
+
3
+ The `UniversalPlaintextFormatter` is a custom logging formatter that extends the standard `logging.Formatter` class. It adds the ability to include extra attributes from log records while excluding standard attributes and configurable keys.
4
+
5
+ ## Usage
6
+
7
+ To use the `UniversalPlaintextFormatter` in your logging configuration, add the following to your `logging.conf` file:
8
+
9
+ ```ini
10
+ [formatter_plaintextFormatter]
11
+ class=cledar.logging.universal_plaintext_formatter.UniversalPlaintextFormatter
12
+ format=%(asctime)s %(name)s [%(levelname)s]: %(message)s
13
+ datefmt=%Y-%m-%d %H:%M:%S
14
+ ```
15
+
16
+ ## Features
17
+
18
+ - Extends the standard logging.Formatter
19
+ - Automatically includes extra attributes from log records
20
+ - Excludes standard LogRecord attributes to keep logs clean
21
+ - Configurable exclusion of additional keys
22
+
23
+ ## Configuration Options
24
+
25
+ In addition to the standard formatter options, you can configure which keys to exclude from the log output:
26
+
27
+ ```ini
28
+ [formatter_plaintextFormatter]
29
+ class=cledar.logging.universal_plaintext_formatter.UniversalPlaintextFormatter
30
+ format=%(asctime)s %(name)s [%(levelname)s]: %(message)s
31
+ datefmt=%Y-%m-%d %H:%M:%S
32
+ exclude_keys=key1,key2,key3
33
+ ```
34
+
35
+ The `exclude_keys` option allows you to specify a comma-separated list of keys that should be excluded from the log output, in addition to the standard LogRecord attributes.
36
+
37
+ ## Example
38
+
39
+ When using this formatter, any extra attributes added to the log record will be automatically included in the log output:
40
+
41
+ ```python
42
+ import logging
43
+
44
+ logger = logging.getLogger(__name__)
45
+ logger.info("User logged in", extra={"user_id": 123, "ip_address": "192.168.1.1"})
46
+ ```
47
+
48
+ Output:
49
+ ```
50
+ 2023-08-04 12:34:56 my_module [INFO]: User logged in
51
+ user_id: 123
52
+ ip_address: 192.168.1.1
53
+ ```
@@ -0,0 +1,3 @@
1
+ from .universal_plaintext_formatter import UniversalPlaintextFormatter
2
+
3
+ __all__ = ["UniversalPlaintextFormatter"]