brawny 0.1.13__py3-none-any.whl → 0.1.22__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- brawny/__init__.py +2 -0
- brawny/_context.py +5 -5
- brawny/_rpc/__init__.py +36 -12
- brawny/_rpc/broadcast.py +14 -13
- brawny/_rpc/caller.py +243 -0
- brawny/_rpc/client.py +539 -0
- brawny/_rpc/clients.py +11 -11
- brawny/_rpc/context.py +23 -0
- brawny/_rpc/errors.py +465 -31
- brawny/_rpc/gas.py +7 -6
- brawny/_rpc/pool.py +18 -0
- brawny/_rpc/retry.py +266 -0
- brawny/_rpc/retry_policy.py +81 -0
- brawny/accounts.py +28 -9
- brawny/alerts/__init__.py +15 -18
- brawny/alerts/abi_resolver.py +212 -36
- brawny/alerts/base.py +2 -2
- brawny/alerts/contracts.py +77 -10
- brawny/alerts/errors.py +30 -3
- brawny/alerts/events.py +38 -5
- brawny/alerts/health.py +19 -13
- brawny/alerts/send.py +513 -55
- brawny/api.py +39 -11
- brawny/assets/AGENTS.md +325 -0
- brawny/async_runtime.py +48 -0
- brawny/chain.py +3 -3
- brawny/cli/commands/__init__.py +2 -0
- brawny/cli/commands/console.py +69 -19
- brawny/cli/commands/contract.py +2 -2
- brawny/cli/commands/controls.py +121 -0
- brawny/cli/commands/health.py +2 -2
- brawny/cli/commands/job_dev.py +6 -5
- brawny/cli/commands/jobs.py +99 -2
- brawny/cli/commands/maintenance.py +13 -29
- brawny/cli/commands/migrate.py +1 -0
- brawny/cli/commands/run.py +10 -3
- brawny/cli/commands/script.py +8 -3
- brawny/cli/commands/signer.py +143 -26
- brawny/cli/helpers.py +0 -3
- brawny/cli_templates.py +25 -349
- brawny/config/__init__.py +4 -1
- brawny/config/models.py +43 -57
- brawny/config/parser.py +268 -57
- brawny/config/validation.py +52 -15
- brawny/daemon/context.py +4 -2
- brawny/daemon/core.py +185 -63
- brawny/daemon/loops.py +166 -98
- brawny/daemon/supervisor.py +261 -0
- brawny/db/__init__.py +14 -26
- brawny/db/base.py +248 -151
- brawny/db/global_cache.py +11 -1
- brawny/db/migrate.py +175 -28
- brawny/db/migrations/001_init.sql +4 -3
- brawny/db/migrations/010_add_nonce_gap_index.sql +1 -1
- brawny/db/migrations/011_add_job_logs.sql +1 -2
- brawny/db/migrations/012_add_claimed_by.sql +2 -2
- brawny/db/migrations/013_attempt_unique.sql +10 -0
- brawny/db/migrations/014_add_lease_expires_at.sql +5 -0
- brawny/db/migrations/015_add_signer_alias.sql +14 -0
- brawny/db/migrations/016_runtime_controls_and_quarantine.sql +32 -0
- brawny/db/migrations/017_add_job_drain.sql +6 -0
- brawny/db/migrations/018_add_nonce_reset_audit.sql +20 -0
- brawny/db/migrations/019_add_job_cooldowns.sql +8 -0
- brawny/db/migrations/020_attempt_unique_initial.sql +7 -0
- brawny/db/ops/__init__.py +3 -25
- brawny/db/ops/logs.py +1 -2
- brawny/db/queries.py +47 -91
- brawny/db/serialized.py +65 -0
- brawny/db/sqlite/__init__.py +1001 -0
- brawny/db/sqlite/connection.py +231 -0
- brawny/db/sqlite/execute.py +116 -0
- brawny/db/sqlite/mappers.py +190 -0
- brawny/db/sqlite/repos/attempts.py +372 -0
- brawny/db/sqlite/repos/block_state.py +102 -0
- brawny/db/sqlite/repos/cache.py +104 -0
- brawny/db/sqlite/repos/intents.py +1021 -0
- brawny/db/sqlite/repos/jobs.py +200 -0
- brawny/db/sqlite/repos/maintenance.py +182 -0
- brawny/db/sqlite/repos/signers_nonces.py +566 -0
- brawny/db/sqlite/tx.py +119 -0
- brawny/http.py +194 -0
- brawny/invariants.py +11 -24
- brawny/jobs/base.py +8 -0
- brawny/jobs/job_validation.py +2 -1
- brawny/keystore.py +83 -7
- brawny/lifecycle.py +64 -12
- brawny/logging.py +0 -2
- brawny/metrics.py +84 -12
- brawny/model/contexts.py +111 -9
- brawny/model/enums.py +1 -0
- brawny/model/errors.py +18 -0
- brawny/model/types.py +47 -131
- brawny/network_guard.py +133 -0
- brawny/networks/__init__.py +5 -5
- brawny/networks/config.py +1 -7
- brawny/networks/manager.py +14 -11
- brawny/runtime_controls.py +74 -0
- brawny/scheduler/poller.py +11 -7
- brawny/scheduler/reorg.py +95 -39
- brawny/scheduler/runner.py +442 -168
- brawny/scheduler/shutdown.py +3 -3
- brawny/script_tx.py +3 -3
- brawny/telegram.py +53 -7
- brawny/testing.py +1 -0
- brawny/timeout.py +38 -0
- brawny/tx/executor.py +922 -308
- brawny/tx/intent.py +54 -16
- brawny/tx/monitor.py +31 -12
- brawny/tx/nonce.py +212 -90
- brawny/tx/replacement.py +69 -18
- brawny/tx/retry_policy.py +24 -0
- brawny/tx/stages/types.py +75 -0
- brawny/types.py +18 -0
- brawny/utils.py +41 -0
- {brawny-0.1.13.dist-info → brawny-0.1.22.dist-info}/METADATA +3 -3
- brawny-0.1.22.dist-info/RECORD +163 -0
- brawny/_rpc/manager.py +0 -982
- brawny/_rpc/selector.py +0 -156
- brawny/db/base_new.py +0 -165
- brawny/db/mappers.py +0 -182
- brawny/db/migrations/008_add_transactions.sql +0 -72
- brawny/db/ops/attempts.py +0 -108
- brawny/db/ops/blocks.py +0 -83
- brawny/db/ops/cache.py +0 -93
- brawny/db/ops/intents.py +0 -296
- brawny/db/ops/jobs.py +0 -110
- brawny/db/ops/nonces.py +0 -322
- brawny/db/postgres.py +0 -2535
- brawny/db/postgres_new.py +0 -196
- brawny/db/sqlite.py +0 -2733
- brawny/db/sqlite_new.py +0 -191
- brawny-0.1.13.dist-info/RECORD +0 -141
- {brawny-0.1.13.dist-info → brawny-0.1.22.dist-info}/WHEEL +0 -0
- {brawny-0.1.13.dist-info → brawny-0.1.22.dist-info}/entry_points.txt +0 -0
- {brawny-0.1.13.dist-info → brawny-0.1.22.dist-info}/top_level.txt +0 -0
brawny/alerts/send.py
CHANGED

@@ -19,11 +19,16 @@ Usage:
 from __future__ import annotations
 
 import asyncio
+import hashlib
 import threading
+import time
+from collections import deque
 from dataclasses import dataclass, field
 from datetime import datetime
 from enum import Enum
-from typing import TYPE_CHECKING, Any, Callable
+from typing import TYPE_CHECKING, Any, Callable
+
+from cachetools import TTLCache
 
 if TYPE_CHECKING:
     from brawny.telegram import TelegramBot
@@ -31,6 +36,19 @@ if TYPE_CHECKING:
 import httpx
 
 from brawny.logging import get_logger
+from brawny.metrics import (
+    ALERTS_ENQUEUED,
+    ALERTS_DROPPED,
+    ALERTS_LAST_ERROR_TIMESTAMP,
+    ALERTS_LAST_SUCCESS_TIMESTAMP,
+    ALERTS_OLDEST_QUEUED_AGE_SECONDS,
+    ALERTS_QUEUE_DEPTH,
+    ALERTS_RETRIED,
+    ALERTS_SENT,
+    ALERTS_WORKER_ALIVE,
+    get_metrics,
+)
+from brawny.network_guard import allow_network_calls
 
 logger = get_logger(__name__)
 
@@ -70,29 +88,382 @@ class AlertConfig:
 # NOTE: No module-level httpx.AsyncClient - asyncio objects are not safe to share
 # across multiple event loops / loop lifetimes. For low-volume alerts, we create
 # a fresh client per request (httpx context manager handles cleanup).
-
+# Multi-threaded access - protected by _last_sent_lock
+# Medium cardinality keys (job_id:event:dest:dest_id): maxsize=10K, ttl=1h
+_last_sent: TTLCache[str, datetime] = TTLCache(maxsize=10_000, ttl=3600)
 # Use threading.Lock, not asyncio.Lock - avoids event loop binding issues
 _last_sent_lock = threading.Lock()
 
+ALERT_QUEUE_MAXSIZE = 1000
+ALERT_SEND_MAX_ATTEMPTS = 5
+ALERT_SEND_BACKOFF_BASE_SECONDS = 1.0
+ALERT_SEND_BACKOFF_MAX_SECONDS = 30.0
+ALERT_WORKER_POLL_SECONDS = 0.1
+ALERT_FLUSH_TIMEOUT_SECONDS = 3.0
+ALERT_LOG_THROTTLE_SECONDS = 60.0
+ALERT_HEALTH_MAX_OLDEST_AGE_SECONDS = 120.0
 
-async def send_alert(payload: AlertPayload, config: AlertConfig) -> None:
-    """Send alert to configured destinations. Fire-and-forget."""
-    tasks: list[Coroutine[Any, Any, None]] = []
 
+@dataclass
+class _AlertTask:
+    payload: AlertPayload
+    destination_type: str
+    destination_id: str
+    channel: str
+    enqueued_at: float
+    attempt: int = 0
+    next_attempt_at: float = 0.0
+    alert_id: str = ""
+    telegram_token: str | None = None
+    webhook_url: str | None = None
+
+
+class AlertService:
+    def __init__(
+        self,
+        *,
+        maxsize: int,
+        max_attempts: int,
+        backoff_base_seconds: float,
+        backoff_max_seconds: float,
+        health_max_oldest_age_seconds: float,
+    ) -> None:
+        self._queue: deque[_AlertTask] = deque()
+        self._delayed: list[_AlertTask] = []
+        self._maxsize = maxsize
+        self._max_attempts = max_attempts
+        self._backoff_base_seconds = backoff_base_seconds
+        self._backoff_max_seconds = backoff_max_seconds
+        self._health_max_oldest_age_seconds = health_max_oldest_age_seconds
+        self._accepting = True
+        self._stop = False
+        self._stop_deadline: float | None = None
+        self._worker_task: asyncio.Task | None = None
+        self._wakeup: asyncio.Event | None = None
+        self._worker_alive = False
+        self._last_success_ts: float | None = None
+        self._last_error_ts: float | None = None
+        self._last_error_type: str | None = None
+        self._last_error_message: str | None = None
+        self._log_throttle: dict[str, float] = {}
+
+    async def start(self) -> None:
+        if self._worker_task and not self._worker_task.done():
+            return
+        self._accepting = True
+        self._stop = False
+        self._stop_deadline = None
+        self._wakeup = asyncio.Event()
+        self._worker_task = asyncio.create_task(self._run(), name="alert-sender")
+
+    async def stop(self, flush_timeout: float) -> None:
+        self._accepting = False
+        self._stop = True
+        self._stop_deadline = time.time() + flush_timeout
+        if self._wakeup is not None:
+            self._wakeup.set()
+        task = self._worker_task
+        if task is None:
+            return
+        try:
+            await asyncio.wait_for(task, timeout=flush_timeout)
+        except asyncio.TimeoutError:
+            task.cancel()
+        self._update_queue_metrics(now=time.time())
+
+    def enqueue(self, task: _AlertTask) -> bool:
+        if not self._accepting:
+            self._record_drop("shutdown", channel=task.channel)
+            return False
+        if self._queue_size() >= self._maxsize:
+            self._record_drop("queue_full", channel=task.channel)
+            self._log_throttled(
+                "queue_full",
+                "alert.queue_full",
+                maxsize=self._maxsize,
+                channel=task.channel,
+            )
+            return False
+        self._queue.append(task)
+        metrics = get_metrics()
+        metrics.counter(ALERTS_ENQUEUED).inc()
+        self._update_queue_metrics(now=time.time())
+        if self._wakeup is not None:
+            self._wakeup.set()
+        return True
+
+    def configure_health_threshold(self, max_oldest_age_seconds: float) -> None:
+        self._health_max_oldest_age_seconds = max_oldest_age_seconds
+
+    async def _run(self) -> None:
+        self._set_worker_alive(True)
+        try:
+            while True:
+                now = time.time()
+                if self._stop and self._stop_deadline and now >= self._stop_deadline:
+                    self._drop_remaining("shutdown_timeout")
+                    break
+                self._move_due_delayed(now)
+                if self._stop and not self._queue and not self._delayed:
+                    break
+                if self._queue:
+                    task = self._queue.popleft()
+                    self._update_queue_metrics(now=now)
+                    await self._process_task(task)
+                    continue
+                wait = self._next_wait_seconds(now)
+                try:
+                    if self._wakeup is not None:
+                        self._wakeup.clear()
+                        await asyncio.wait_for(self._wakeup.wait(), timeout=wait)
+                    else:
+                        await asyncio.sleep(wait)
+                except asyncio.TimeoutError:
+                    pass
+        finally:
+            self._set_worker_alive(False)
+
+    async def _process_task(self, task: _AlertTask) -> None:
+        metrics = get_metrics()
+        task.attempt += 1
+        attempt = task.attempt
+        self._log_state(task, state="sending")
+        try:
+            await _send_task(task)
+        except Exception as exc:
+            retryable, error_type = _classify_error(exc)
+            self._record_error(error_type, str(exc))
+            if retryable and attempt < self._max_attempts:
+                metrics.counter(ALERTS_RETRIED).inc()
+                task.next_attempt_at = time.time() + _backoff_seconds(
+                    attempt,
+                    base_seconds=self._backoff_base_seconds,
+                    max_seconds=self._backoff_max_seconds,
+                )
+                self._log_state(task, state="retry_scheduled", error_type=error_type)
+                self._delayed.append(task)
+                self._update_queue_metrics(now=time.time())
+                if self._wakeup is not None:
+                    self._wakeup.set()
+                return
+            reason = "max_attempts" if attempt >= self._max_attempts else "non_retryable"
+            self._log_state(task, state="dropped", error_type=error_type)
+            self._record_drop(reason, channel=task.channel)
+            return
+
+        metrics.counter(ALERTS_SENT).inc()
+        self._record_success()
+        self._log_state(task, state="sent")
+
+    def _record_drop(self, reason: str, *, channel: str) -> None:
+        metrics = get_metrics()
+        metrics.counter(ALERTS_DROPPED).inc(reason=reason, channel=channel)
+
+    def _record_success(self) -> None:
+        self._last_success_ts = time.time()
+        metrics = get_metrics()
+        metrics.gauge(ALERTS_LAST_SUCCESS_TIMESTAMP).set(self._last_success_ts)
+
+    def _record_error(self, error_type: str, message: str) -> None:
+        self._last_error_ts = time.time()
+        self._last_error_type = error_type
+        self._last_error_message = message[:200]
+        metrics = get_metrics()
+        metrics.gauge(ALERTS_LAST_ERROR_TIMESTAMP).set(self._last_error_ts)
+
+    def _queue_size(self) -> int:
+        return len(self._queue) + len(self._delayed)
+
+    def _oldest_age_seconds(self, now: float) -> float:
+        if not self._queue and not self._delayed:
+            return 0.0
+        oldest = min(
+            [task.enqueued_at for task in self._queue]
+            + [task.enqueued_at for task in self._delayed]
+        )
+        return max(0.0, now - oldest)
+
+    def _update_queue_metrics(self, now: float) -> None:
+        metrics = get_metrics()
+        metrics.gauge(ALERTS_QUEUE_DEPTH).set(self._queue_size())
+        metrics.gauge(ALERTS_OLDEST_QUEUED_AGE_SECONDS).set(self._oldest_age_seconds(now))
+
+    def _move_due_delayed(self, now: float) -> None:
+        if not self._delayed:
+            return
+        due: list[_AlertTask] = []
+        remaining: list[_AlertTask] = []
+        for task in self._delayed:
+            if task.next_attempt_at <= now:
+                due.append(task)
+            else:
+                remaining.append(task)
+        self._delayed = remaining
+        if due:
+            self._queue.extend(due)
+            self._update_queue_metrics(now=now)
+
+    def _next_wait_seconds(self, now: float) -> float:
+        if not self._delayed:
+            return ALERT_WORKER_POLL_SECONDS
+        next_due = min(task.next_attempt_at for task in self._delayed)
+        wait = max(0.0, next_due - now)
+        return min(ALERT_WORKER_POLL_SECONDS, wait)
+
+    def _set_worker_alive(self, alive: bool) -> None:
+        self._worker_alive = alive
+        metrics = get_metrics()
+        metrics.gauge(ALERTS_WORKER_ALIVE).set(1.0 if alive else 0.0)
+
+    def _drop_remaining(self, reason: str) -> None:
+        while self._queue:
+            task = self._queue.popleft()
+            self._record_drop(reason, channel=task.channel)
+        while self._delayed:
+            task = self._delayed.pop()
+            self._record_drop(reason, channel=task.channel)
+        self._update_queue_metrics(now=time.time())
+
+    def _log_state(self, task: _AlertTask, *, state: str, error_type: str | None = None) -> None:
+        logger.info(
+            "alert.delivery_state",
+            alert_id=task.alert_id,
+            attempt=task.attempt,
+            state=state,
+            error_type=error_type,
+            channel=task.channel,
+        )
+
+    def _log_throttled(self, reason: str, event: str, **fields: object) -> None:
+        now = time.time()
+        last = self._log_throttle.get(reason)
+        if last is not None and now - last < ALERT_LOG_THROTTLE_SECONDS:
+            return
+        self._log_throttle[reason] = now
+        logger.warning(event, reason=reason, **fields)
+
+    def health_snapshot(self) -> dict[str, object]:
+        now = time.time()
+        queue_depth = self._queue_size()
+        oldest_age = self._oldest_age_seconds(now)
+        alive = self._worker_alive
+        healthy = queue_depth == 0 or (alive and oldest_age < self._health_max_oldest_age_seconds)
+        return {
+            "alive": alive,
+            "queue_depth": queue_depth,
+            "oldest_queued_age_seconds": oldest_age,
+            "healthy": healthy,
+            "last_success_timestamp": self._last_success_ts,
+            "last_error_timestamp": self._last_error_ts,
+            "last_error_type": self._last_error_type,
+            "last_error_message": self._last_error_message,
+        }
+
+
+def _make_task(
+    payload: AlertPayload,
+    *,
+    destination_type: str,
+    destination_id: str,
+    telegram_token: str | None = None,
+    webhook_url: str | None = None,
+) -> _AlertTask:
+    enqueued_at = time.time()
+    alert_id = _make_alert_id(payload, destination_type, destination_id)
+    return _AlertTask(
+        payload=payload,
+        destination_type=destination_type,
+        destination_id=destination_id,
+        channel=destination_type,
+        enqueued_at=enqueued_at,
+        next_attempt_at=enqueued_at,
+        alert_id=alert_id,
+        telegram_token=telegram_token,
+        webhook_url=webhook_url,
+    )
+
+
+def _make_alert_id(payload: AlertPayload, destination_type: str, destination_id: str) -> str:
+    raw = f"{destination_type}:{destination_id}:{payload.job_id}:{payload.event_type.value}:{payload.message}"
+    return hashlib.sha1(raw.encode("utf-8")).hexdigest()[:12]
+
+
+def _backoff_seconds(attempt: int, *, base_seconds: float, max_seconds: float) -> float:
+    return min(base_seconds * (2 ** (attempt - 1)), max_seconds)
+
+
+def _classify_error(exc: Exception) -> tuple[bool, str]:
+    if isinstance(exc, httpx.TimeoutException):
+        return True, "timeout"
+    if isinstance(exc, httpx.RequestError):
+        return True, "network_error"
+    if isinstance(exc, httpx.HTTPStatusError):
+        status = exc.response.status_code
+        error_type = f"http_{status}"
+        if status == 429 or 500 <= status < 600:
+            return True, error_type
+        if status in (400, 401, 403, 404):
+            return False, error_type
+        return False, error_type
+    return False, type(exc).__name__
+
+_alert_service: AlertService | None = None
+
+
+def set_alert_service(service: AlertService | None) -> None:
+    global _alert_service
+    _alert_service = service
+
+
+def _require_alert_service() -> AlertService:
+    if _alert_service is None:
+        raise RuntimeError("AlertService is not initialized")
+    return _alert_service
+
+
+async def send_alert(payload: AlertPayload, config: AlertConfig) -> None:
+    """Enqueue alert for background delivery. Never blocks core path."""
+    service = _require_alert_service()
     if config.telegram_token and config.telegram_chat_ids:
         for chat_id in config.telegram_chat_ids:
             if _should_send(payload, "telegram", chat_id, config.rate_limit_seconds):
-
+                service.enqueue(
+                    _make_task(
+                        payload,
+                        destination_type="telegram",
+                        destination_id=str(chat_id),
+                        telegram_token=config.telegram_token,
+                    )
+                )
 
     if config.webhook_url:
         if _should_send(payload, "webhook", config.webhook_url, config.rate_limit_seconds):
-
+            service.enqueue(
+                _make_task(
+                    payload,
+                    destination_type="webhook",
+                    destination_id=config.webhook_url,
+                    webhook_url=config.webhook_url,
+                )
+            )
+
+
+def enqueue_alert(payload: AlertPayload, config: AlertConfig) -> None:
+    """Sync wrapper for enqueuing alerts from non-async code."""
+    from brawny.async_runtime import run_sync
+
+    run_sync(send_alert(payload, config))
+
+
+def configure_alert_worker(*, health_max_oldest_age_seconds: float | None = None) -> None:
+    service = _require_alert_service()
+    if health_max_oldest_age_seconds is not None:
+        service.configure_health_threshold(health_max_oldest_age_seconds)
 
-
-
-
-
-            _log_failure(payload, tasks[i], result)
+
+def get_alert_worker_health() -> dict[str, object]:
+    service = _require_alert_service()
+    return service.health_snapshot()
 
 
 def _should_send(
@@ -131,9 +502,10 @@ async def _send_telegram(token: str, chat_id: str, payload: AlertPayload) -> None:
         "parse_mode": parse_mode,
         "disable_web_page_preview": True,
     }
-
-
-
+    with allow_network_calls(reason="alerts"):
+        async with httpx.AsyncClient(timeout=10.0) as client:
+            resp = await client.post(url, json=data)
+            resp.raise_for_status()
 
 
 async def _send_webhook(url: str, payload: AlertPayload) -> None:
@@ -149,48 +521,42 @@ async def _send_webhook(url: str, payload: AlertPayload) -> None:
 
     Do not add fields without versioning discussion.
     """
-
-
-
-
-
-
-
-
-
-
-
-
-
+    with allow_network_calls(reason="alerts"):
+        async with httpx.AsyncClient(timeout=10.0) as client:
+            resp = await client.post(
+                url,
+                json={
+                    "job_id": payload.job_id,
+                    "job_name": payload.job_name,
+                    "event_type": payload.event_type.value,
+                    "message": payload.message,
+                    "chain_id": payload.chain_id,
+                    "timestamp": payload.timestamp.isoformat() + "Z",
+                },
+            )
+            resp.raise_for_status()
 
 
-def
-
-
+async def _send_task(task: _AlertTask) -> None:
+    if task.destination_type == "telegram":
+        if task.telegram_token is None:
+            raise RuntimeError("telegram_token is required")
+        await _send_telegram(task.telegram_token, task.destination_id, task.payload)
+        return
+    if task.destination_type == "webhook":
+        if task.webhook_url is None:
+            raise RuntimeError("webhook_url is required")
+        await _send_webhook(task.webhook_url, task.payload)
+        return
+    raise RuntimeError(f"Unknown destination type: {task.destination_type}")
 
-
-
-
-
-
-
-
-        )
-    elif "webhook" in task_name.lower():
-        logger.warning(
-            "alert_delivery_failed",
-            job_id=payload.job_id,
-            event_type=payload.event_type.value,
-            destination="webhook",
-            error=str(error),
-        )
-    else:
-        logger.warning(
-            "alert_delivery_failed",
-            job_id=payload.job_id,
-            event_type=payload.event_type.value,
-            error=str(error),
-        )
+
+def flush_alert_queue(timeout_seconds: float | None = None) -> None:
+    timeout = ALERT_FLUSH_TIMEOUT_SECONDS if timeout_seconds is None else timeout_seconds
+    service = _require_alert_service()
+    from brawny.async_runtime import run_sync
+
+    run_sync(service.stop(flush_timeout=timeout))
 
 
 # =============================================================================
@@ -299,7 +665,9 @@ async def _send_alert_logged(payload: AlertPayload, config: AlertConfig) -> None:
 # =============================================================================
 
 # Separate rate limiting for health alerts (prevents job alert noise from blocking health)
-
+# Multi-threaded access - protected by _health_lock
+# Low cardinality keys (chat IDs): maxsize=1K, ttl=1h
+_health_last_sent: TTLCache[str, datetime] = TTLCache(maxsize=1_000, ttl=3600)
 _health_lock = threading.Lock()
 
 HEALTH_RATE_LIMIT_SECONDS = 1.0  # Min interval between health messages to same chat
@@ -362,3 +730,93 @@ def create_send_health(bot: "TelegramBot") -> "Callable[[str, str], None]":
         )
 
     return send_health
+
+
+# =============================================================================
+# JobAlertSender for ctx.alert() in Lifecycle Hooks
+# =============================================================================
+
+
+class JobAlertSender:
+    """Alert sender bound to a specific job's routing configuration.
+
+    Used by lifecycle contexts (TriggerContext, SuccessContext, FailureContext)
+    to provide ctx.alert() that routes to job-specific destinations.
+
+    This class implements the AlertSender protocol from model.contexts.
+    """
+
+    def __init__(
+        self,
+        *,
+        telegram_bot: "TelegramBot | None",
+        telegram_config: Any,  # TelegramConfig
+        job_alert_to: list[str] | None,
+        job_id: str,
+    ) -> None:
+        """Initialize with job-specific routing.
+
+        Args:
+            telegram_bot: TelegramBot instance (None if not configured)
+            telegram_config: TelegramConfig with chats, default, parse_mode
+            job_alert_to: Job-specific alert destinations (or None for default)
+            job_id: Job ID for logging
+        """
+        self._bot = telegram_bot
+        self._tg_config = telegram_config
+        self._job_alert_to = job_alert_to
+        self._job_id = job_id
+
+    def send(
+        self,
+        message: str,
+        *,
+        to: str | list[str] | None = None,
+        parse_mode: str | None = None,
+    ) -> None:
+        """Send alert to configured destinations.
+
+        Routing priority:
+        1. `to` parameter (explicit override)
+        2. job_alert_to (job-specific config)
+        3. telegram.default (global default)
+
+        Args:
+            message: Alert text (up to 4096 characters)
+            to: Override routing target (name, ID, or list)
+            parse_mode: "Markdown", "MarkdownV2", "HTML", or None for config default
+        """
+        if not self._bot or not self._tg_config:
+            return  # Silent no-op (warned once at startup)
+
+        from brawny.alerts.routing import resolve_targets
+
+        # Determine target
+        if to is not None:
+            target = to
+        else:
+            target = self._job_alert_to
+
+        # Resolve to chat IDs
+        chat_ids = resolve_targets(
+            target,
+            self._tg_config.chats,
+            self._tg_config.default,
+            job_id=self._job_id,
+        )
+
+        if not chat_ids:
+            return  # No targets configured
+
+        # Send to each resolved chat
+        for chat_id in chat_ids:
+            effective_parse_mode = (
+                parse_mode if parse_mode is not None
+                else self._tg_config.parse_mode or "Markdown"
+            )
+            self._bot.send_message(
+                message,
+                chat_id=chat_id,
+                parse_mode=effective_parse_mode,
+                disable_web_page_preview=True,
+            )