avtomatika-1.0b7-py3-none-any.whl → avtomatika-1.0b8-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- avtomatika/app_keys.py +1 -0
- avtomatika/config.py +10 -0
- avtomatika/data_types.py +2 -1
- avtomatika/dispatcher.py +8 -26
- avtomatika/engine.py +19 -1
- avtomatika/executor.py +34 -6
- avtomatika/health_checker.py +23 -5
- avtomatika/history/base.py +60 -6
- avtomatika/history/noop.py +18 -7
- avtomatika/history/postgres.py +8 -6
- avtomatika/history/sqlite.py +7 -5
- avtomatika/metrics.py +1 -1
- avtomatika/reputation.py +46 -40
- avtomatika/s3.py +323 -0
- avtomatika/storage/base.py +45 -4
- avtomatika/storage/memory.py +44 -6
- avtomatika/storage/redis.py +185 -252
- avtomatika/utils/webhook_sender.py +44 -2
- avtomatika/watcher.py +33 -35
- avtomatika/ws_manager.py +7 -6
- {avtomatika-1.0b7.dist-info → avtomatika-1.0b8.dist-info}/METADATA +50 -2
- avtomatika-1.0b8.dist-info/RECORD +46 -0
- avtomatika-1.0b7.dist-info/RECORD +0 -45
- {avtomatika-1.0b7.dist-info → avtomatika-1.0b8.dist-info}/WHEEL +0 -0
- {avtomatika-1.0b7.dist-info → avtomatika-1.0b8.dist-info}/licenses/LICENSE +0 -0
- {avtomatika-1.0b7.dist-info → avtomatika-1.0b8.dist-info}/top_level.txt +0 -0
avtomatika/storage/redis.py
CHANGED
@@ -35,6 +35,12 @@ class RedisStorage(StorageBackend):
     def _get_key(self, job_id: str) -> str:
         return f"{self._prefix}:{job_id}"
 
+    async def get_worker_info(self, worker_id: str) -> dict[str, Any] | None:
+        """Gets the full info for a worker by its ID."""
+        key = f"orchestrator:worker:info:{worker_id}"
+        data = await self._redis.get(key)
+        return self._unpack(data) if data else None
+
     @staticmethod
     def _pack(data: Any) -> bytes:
         return packb(data, use_bin_type=True)
@@ -55,10 +61,8 @@ class RedisStorage(StorageBackend):
         key = f"orchestrator:task_queue:{worker_type}"
 
         pipe = self._redis.pipeline()
-        pipe.zcard(key)
-        # Get the top 3 highest priority bids (scores)
+        pipe.zcard(key)
         pipe.zrange(key, -3, -1, withscores=True, score_cast_func=float)
-        # Get the top 3 lowest priority bids (scores)
         pipe.zrange(key, 0, 2, withscores=True, score_cast_func=float)
         results = await pipe.execute()
 
@@ -66,7 +70,6 @@ class RedisStorage(StorageBackend):
         top_bids = [score for _, score in reversed(top_bids_raw)]
         bottom_bids = [score for _, score in bottom_bids_raw]
 
-        # Simple average calculation, can be improved for large queues
         all_scores = [s for _, s in await self._redis.zrange(key, 0, -1, withscores=True, score_cast_func=float)]
         avg_bid = sum(all_scores) / len(all_scores) if all_scores else 0
 
@@ -102,8 +105,6 @@ class RedisStorage(StorageBackend):
                 await pipe.watch(key)
                 current_state_raw = await pipe.get(key)
                 current_state = self._unpack(current_state_raw) if current_state_raw else {}
-
-                # Simple dictionary merge. For nested structures, a deep merge may be required.
                 current_state.update(update_data)
 
                 pipe.multi()
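This hunk (and update_worker_data further down) leans on redis-py's optimistic-locking pipeline: WATCH the key, read and modify the value, then MULTI/EXEC, and treat WatchError as a lost race. A minimal standalone sketch of that pattern, assuming redis.asyncio and JSON in place of the module's msgpack packing:

from asyncio import run
from json import dumps, loads

from redis.asyncio import Redis
from redis.exceptions import WatchError

async def merge_state(redis: Redis, key: str, update: dict) -> dict | None:
    async with redis.pipeline(transaction=True) as pipe:
        try:
            await pipe.watch(key)      # EXEC aborts if `key` changes after this point
            raw = await pipe.get(key)  # while watching, commands run immediately
            state = loads(raw) if raw else {}
            state.update(update)
            pipe.multi()               # back to buffered, transactional mode
            pipe.set(key, dumps(state))
            await pipe.execute()
            return state
        except WatchError:
            return None                # a concurrent writer won; skip or retry

async def main() -> None:
    redis = Redis()
    print(await merge_state(redis, "demo:state", {"status": "running"}))
    await redis.aclose()

run(main())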
@@ -119,55 +120,46 @@ class RedisStorage(StorageBackend):
         worker_info: dict[str, Any],
         ttl: int,
     ) -> None:
-        """Registers a worker in Redis."""
+        """Registers a worker in Redis and updates indexes."""
         worker_info.setdefault("reputation", 1.0)
         key = f"orchestrator:worker:info:{worker_id}"
-        await self._redis.set(key, self._pack(worker_info), ex=ttl)
+        tasks_key = f"orchestrator:worker:tasks:{worker_id}"
 
-    async def enqueue_task_for_worker(
-        self,
-        worker_id: str,
-        task_payload: dict[str, Any],
-        priority: float,
-    ) -> None:
-        """Adds a task to the priority queue (Sorted Set) for a worker."""
-        key = f"orchestrator:task_queue:{worker_id}"
-        await self._redis.zadd(key, {self._pack(task_payload): priority})
+        async with self._redis.pipeline(transaction=True) as pipe:
+            pipe.set(key, self._pack(worker_info), ex=ttl)
+            pipe.sadd("orchestrator:index:workers:all", worker_id)
 
-    async def dequeue_task_for_worker(
-        self,
-        worker_id: str,
-        timeout: int,
-    ) -> dict[str, Any] | None:
-        """Retrieves the highest priority task from the queue (Sorted Set),
-        using the blocking BZPOPMAX operation.
-        """
-        key = f"orchestrator:task_queue:{worker_id}"
-        try:
-            # BZPOPMAX returns a tuple (key, member, score)
-            result = await self._redis.bzpopmax([key], timeout=timeout)
-            return self._unpack(result[1]) if result else None
-        except CancelledError:
-            return None
-        except ResponseError as e:
-            # Error handling if `fakeredis` does not support BZPOPMAX
-            if "unknown command" in str(e).lower() or "wrong number of arguments" in str(e).lower():
-                logger.warning(
-                    "BZPOPMAX is not supported (likely running with fakeredis). "
-                    "Falling back to non-blocking ZPOPMAX for testing.",
-                )
-                # Non-blocking fallback for tests
-                res = await self._redis.zpopmax(key)
-                if res:
-                    return self._unpack(res[0][0])
-            raise e
+            if worker_info.get("status", "idle") == "idle":
+                pipe.sadd("orchestrator:index:workers:idle", worker_id)
+            else:
+                pipe.srem("orchestrator:index:workers:idle", worker_id)
 
-
-
+            supported_tasks = worker_info.get("supported_tasks", [])
+            if supported_tasks:
+                pipe.sadd(tasks_key, *supported_tasks)
+                for task in supported_tasks:
+                    pipe.sadd(f"orchestrator:index:workers:task:{task}", worker_id)
+
+            await pipe.execute()
+
+    async def deregister_worker(self, worker_id: str) -> None:
+        """Deletes the worker key and removes it from all indexes."""
         key = f"orchestrator:worker:info:{worker_id}"
-
-
-
+        tasks_key = f"orchestrator:worker:tasks:{worker_id}"
+
+        tasks = await self._redis.smembers(tasks_key)  # type: ignore
+
+        async with self._redis.pipeline(transaction=True) as pipe:
+            pipe.delete(key)
+            pipe.delete(tasks_key)
+            pipe.srem("orchestrator:index:workers:all", worker_id)
+            pipe.srem("orchestrator:index:workers:idle", worker_id)
+
+            for task in tasks:
+                task_str = task.decode("utf-8") if isinstance(task, bytes) else task
+                pipe.srem(f"orchestrator:index:workers:task:{task_str}", worker_id)
+
+            await pipe.execute()
 
     async def update_worker_status(
         self,
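The register/deregister pair above replaces SCAN-based discovery with secondary indexes kept in plain Redis sets: one for all workers, one for idle workers, and one per supported task type. A small sketch of the resulting key layout (key names taken from the diff; redis.asyncio assumed):

from asyncio import run

from redis.asyncio import Redis

async def main() -> None:
    redis = Redis()
    # What register_worker writes for an idle worker "w1" that supports "transcode":
    await redis.sadd("orchestrator:index:workers:all", "w1")
    await redis.sadd("orchestrator:index:workers:idle", "w1")
    await redis.sadd("orchestrator:worker:tasks:w1", "transcode")
    await redis.sadd("orchestrator:index:workers:task:transcode", "w1")
    # Deregistration is the mirror image: SREM from each index, DELETE the task set.
    idle = await redis.smembers("orchestrator:index:workers:idle")
    print([m.decode() for m in idle])  # ['w1']
    await redis.aclose()

run(main())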
@@ -184,102 +176,131 @@ class RedisStorage(StorageBackend):
                     return None
 
                 current_state = self._unpack(current_state_raw)
-
-                # Create a potential new state to compare against the current one
                 new_state = current_state.copy()
                 new_state.update(status_update)
 
                 pipe.multi()
 
-                # Only write to Redis if the state has actually changed.
                 if new_state != current_state:
                     pipe.set(key, self._pack(new_state), ex=ttl)
-
+                    old_status = current_state.get("status", "idle")
+                    new_status = new_state.get("status", "idle")
+
+                    if old_status != new_status:
+                        if new_status == "idle":
+                            pipe.sadd("orchestrator:index:workers:idle", worker_id)
+                        else:
+                            pipe.srem("orchestrator:index:workers:idle", worker_id)
+                    current_state = new_state
                 else:
-                    # If nothing changed, just refresh the TTL to keep the worker alive.
                     pipe.expire(key, ttl)
 
                 await pipe.execute()
                 return current_state
             except WatchError:
-                # In case of a conflict, the operation can be repeated,
-                # but for a heartbeat it is not critical, you can just skip it.
                 return None
 
-    async def update_worker_data(
-        self,
-        worker_id: str,
-        update_data: dict[str, Any],
-    ) -> dict[str, Any] | None:
+    async def find_workers_for_task(self, task_type: str) -> list[str]:
+        """Finds idle workers that support the given task using set intersection."""
+        task_index = f"orchestrator:index:workers:task:{task_type}"
+        idle_index = "orchestrator:index:workers:idle"
+        worker_ids = await self._redis.sinter(task_index, idle_index)  # type: ignore
+        return [wid.decode("utf-8") if isinstance(wid, bytes) else wid for wid in worker_ids]
+
+    async def enqueue_task_for_worker(self, worker_id: str, task_payload: dict[str, Any], priority: float) -> None:
+        key = f"orchestrator:task_queue:{worker_id}"
+        await self._redis.zadd(key, {self._pack(task_payload): priority})
+
+    async def dequeue_task_for_worker(self, worker_id: str, timeout: int) -> dict[str, Any] | None:
+        key = f"orchestrator:task_queue:{worker_id}"
+        try:
+            result = await self._redis.bzpopmax([key], timeout=timeout)
+            return self._unpack(result[1]) if result else None
+        except CancelledError:
+            return None
+        except ResponseError as e:
+            if "unknown command" in str(e).lower() or "wrong number of arguments" in str(e).lower():
+                res = await self._redis.zpopmax(key)
+                if res:
+                    return self._unpack(res[0][0])
+            raise e
+
+    async def refresh_worker_ttl(self, worker_id: str, ttl: int) -> bool:
+        was_set = await self._redis.expire(f"orchestrator:worker:info:{worker_id}", ttl)
+        return bool(was_set)
+
+    async def update_worker_data(self, worker_id: str, update_data: dict[str, Any]) -> dict[str, Any] | None:
         key = f"orchestrator:worker:info:{worker_id}"
         async with self._redis.pipeline(transaction=True) as pipe:
             try:
                 await pipe.watch(key)
-                current_state_raw = await pipe.get(key)
-                if not current_state_raw:
+                raw = await pipe.get(key)
+                if not raw:
                     return None
-
-                current_state = self._unpack(current_state_raw)
-                current_state.update(update_data)
-
+                data = self._unpack(raw)
+                data.update(update_data)
                 pipe.multi()
-
-                pipe.set(key, self._pack(current_state))
+                pipe.set(key, self._pack(data))
                 await pipe.execute()
-                return current_state
+                return data
             except WatchError:
-                # In case of a conflict, the operation can be repeated
-                logger.warning(
-                    f"WatchError during worker data update for {worker_id}, retrying.",
-                )
-                # In this case, it is better to repeat, as updating the reputation is important
                 return await self.update_worker_data(worker_id, update_data)
 
     async def get_available_workers(self) -> list[dict[str, Any]]:
-
-        worker_keys = [key async for key in self._redis.scan_iter("orchestrator:worker:info:*")]  # type: ignore[attr-defined]
-
+        worker_keys = [key async for key in self._redis.scan_iter("orchestrator:worker:info:*")]  # type: ignore
         if not worker_keys:
             return []
+        data_list = await self._redis.mget(worker_keys)
+        return [self._unpack(data) for data in data_list if data]
 
-
-
+    async def get_workers(self, worker_ids: list[str]) -> list[dict[str, Any]]:
+        if not worker_ids:
+            return []
+        keys = [f"orchestrator:worker:info:{wid}" for wid in worker_ids]
+        data_list = await self._redis.mget(keys)
+        return [self._unpack(data) for data in data_list if data]
+
+    async def get_active_worker_ids(self) -> list[str]:
+        worker_ids = await self._redis.smembers("orchestrator:index:workers:all")  # type: ignore
+        return [wid.decode("utf-8") if isinstance(wid, bytes) else wid for wid in worker_ids]
+
+    async def cleanup_expired_workers(self) -> None:
+        worker_ids = await self.get_active_worker_ids()
+        if not worker_ids:
+            return
+        pipe = self._redis.pipeline()
+        for wid in worker_ids:
+            pipe.exists(f"orchestrator:worker:info:{wid}")
+        existence = await pipe.execute()
+        dead_ids = [worker_ids[i] for i, exists in enumerate(existence) if not exists]
+        for wid in dead_ids:
+            tasks = await self._redis.smembers(f"orchestrator:worker:tasks:{wid}")  # type: ignore
+            async with self._redis.pipeline(transaction=True) as p:
+                p.delete(f"orchestrator:worker:tasks:{wid}")
+                p.srem("orchestrator:index:workers:all", wid)
+                p.srem("orchestrator:index:workers:idle", wid)
+                for t in tasks:
+                    p.srem(f"orchestrator:index:workers:task:{t.decode() if isinstance(t, bytes) else t}", wid)
+                await p.execute()
 
     async def add_job_to_watch(self, job_id: str, timeout_at: float) -> None:
-        """Adds a job to a Redis sorted set.
-        The score is the timeout time.
-        """
         await self._redis.zadd("orchestrator:watched_jobs", {job_id: timeout_at})
 
     async def remove_job_from_watch(self, job_id: str) -> None:
-        """Removes a job from the sorted set for tracking."""
         await self._redis.zrem("orchestrator:watched_jobs", job_id)
 
-    async def get_timed_out_jobs(self) -> list[str]:
-        """Finds and removes overdue jobs from the sorted set."""
+    async def get_timed_out_jobs(self, limit: int = 100) -> list[str]:
         now = get_running_loop().time()
-
-        timed_out_ids = await self._redis.zrangebyscore(
-            "orchestrator:watched_jobs",
-            0,
-            now,
-        )
-
-        if timed_out_ids:
-            # Atomically remove the found IDs
-            await self._redis.zrem("orchestrator:watched_jobs", *timed_out_ids)  # type: ignore[arg-type]
-            return [job_id.decode("utf-8") for job_id in timed_out_ids]
-
+        ids = await self._redis.zrangebyscore("orchestrator:watched_jobs", 0, now, start=0, num=limit)
+        if ids:
+            await self._redis.zrem("orchestrator:watched_jobs", *ids)  # type: ignore
+            return [i.decode("utf-8") for i in ids]
         return []
 
     async def enqueue_job(self, job_id: str) -> None:
-        """Adds a job to the Redis stream."""
         await self._redis.xadd(self._stream_key, {"job_id": job_id})
 
-    async def dequeue_job(self) -> tuple[str, str] | None:
-        """Retrieves a job from the Redis stream using consumer groups.
-        Implements a recovery strategy: checks for pending messages first.
-        """
+    async def dequeue_job(self, block: int | None = None) -> tuple[str, str] | None:
         if not self._group_created:
             try:
                 await self._redis.xgroup_create(self._stream_key, self._group_name, id="0", mkstream=True)
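Two primitives carry the new dispatch path introduced above: SINTER of the idle index with a task index yields eligible workers without scanning, and each worker's queue is a sorted set drained with the blocking BZPOPMAX, so the highest-scored payload comes out first. A runnable sketch of both, assuming redis.asyncio and msgpack as in the module:

from asyncio import run

from msgpack import packb, unpackb
from redis.asyncio import Redis

async def main() -> None:
    redis = Redis()
    # Matchmaking: intersection of idle workers and workers that support the task.
    await redis.sadd("orchestrator:index:workers:idle", "w1", "w2")
    await redis.sadd("orchestrator:index:workers:task:ocr", "w2", "w3")
    print(await redis.sinter("orchestrator:index:workers:task:ocr",
                             "orchestrator:index:workers:idle"))  # {b'w2'}

    # Per-worker priority queue: member = packed payload, score = priority.
    queue = "orchestrator:task_queue:w2"
    await redis.zadd(queue, {packb({"job": "low"}): 1.0, packb({"job": "urgent"}): 9.0})
    popped = await redis.bzpopmax([queue], timeout=1)  # (key, member, score) or None
    if popped:
        print(unpackb(popped[1], raw=False))  # {'job': 'urgent'} is delivered first
    await redis.aclose()

run(main())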
@@ -287,79 +308,39 @@ class RedisStorage(StorageBackend):
                 if "BUSYGROUP" not in str(e):
                     raise e
             self._group_created = True
-
         try:
-            try:
-                autoclaim_result = await self._redis.xautoclaim(
-                    self._stream_key,
-                    self._group_name,
-                    self._consumer_name,
-                    min_idle_time=self._min_idle_time_ms,
-                    start_id="0-0",
-                    count=1,
-                )
-                if autoclaim_result and autoclaim_result[1]:
-                    messages = autoclaim_result[1]
-                    message_id, data = messages[0]
-                    if data:
-                        job_id = data[b"job_id"].decode("utf-8")
-                        logger.info(f"Reclaimed pending message {message_id} for consumer {self._consumer_name}")
-                        return job_id, message_id.decode("utf-8")
-            except Exception as e:
-                if "unknown command" in str(e).lower() or isinstance(e, ResponseError):
-                    pending_result = await self._redis.xreadgroup(
-                        self._group_name,
-                        self._consumer_name,
-                        {self._stream_key: "0"},
-                        count=1,
-                    )
-                    if pending_result:
-                        stream_name, messages = pending_result[0]
-                        if messages:
-                            message_id, data = messages[0]
-                            job_id = data[b"job_id"].decode("utf-8")
-                            return job_id, message_id.decode("utf-8")
-                else:
-                    raise e
-
-            result = await self._redis.xreadgroup(
+            claim = await self._redis.xautoclaim(
+                self._stream_key,
                 self._group_name,
                 self._consumer_name,
-                {self._stream_key: ">"},
+                min_idle_time=self._min_idle_time_ms,
+                start_id="0-0",
                 count=1,
             )
-            if result:
-                stream_name, messages = result[0]
-                message_id, data = messages[0]
-                job_id = data[b"job_id"].decode("utf-8")
-                return job_id, message_id.decode("utf-8")
+            if claim and claim[1]:
+                msg_id, data = claim[1][0]
+                return data[b"job_id"].decode("utf-8"), msg_id.decode("utf-8")
+            read = await self._redis.xreadgroup(
+                self._group_name, self._consumer_name, {self._stream_key: ">"}, count=1, block=block
+            )
+            if read:
+                msg_id, data = read[0][1][0]
+                return data[b"job_id"].decode("utf-8"), msg_id.decode("utf-8")
             return None
         except CancelledError:
             return None
 
     async def ack_job(self, message_id: str) -> None:
-        """Acknowledges a message in the Redis stream."""
         await self._redis.xack(self._stream_key, self._group_name, message_id)
 
     async def quarantine_job(self, job_id: str) -> None:
-        ""
-        await self._redis.lpush("orchestrator:quarantine_queue", job_id)  # type: ignore[arg-type]
+        await self._redis.lpush("orchestrator:quarantine_queue", job_id)  # type: ignore
 
     async def get_quarantined_jobs(self) -> list[str]:
-
-        jobs_bytes = await self._redis.lrange("orchestrator:quarantine_queue", 0, -1)
-        return [job.decode("utf-8") for job in jobs_bytes]
-
-    async def deregister_worker(self, worker_id: str) -> None:
-        """Deletes the worker key from Redis."""
-        key = f"orchestrator:worker:info:{worker_id}"
-        await self._redis.delete(key)
+        jobs = await self._redis.lrange("orchestrator:quarantine_queue", 0, -1)
+        return [j.decode("utf-8") for j in jobs]
 
     async def increment_key_with_ttl(self, key: str, ttl: int) -> int:
-        """Atomically increments a counter and sets a TTL on the first call,
-        using a Lua script for atomicity.
-        Returns the new value of the counter.
-        """
         async with self._redis.pipeline(transaction=True) as pipe:
             pipe.incr(key)
             pipe.expire(key, ttl)
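The rewritten dequeue_job collapses the old nested fallbacks into the canonical Redis Streams loop: XAUTOCLAIM first, to adopt messages another consumer left pending longer than min_idle_time, then XREADGROUP ">" for fresh entries, with XACK only after successful handling. A sketch of that loop with illustrative stream and group names (redis.asyncio assumed; XAUTOCLAIM needs Redis 6.2+):

from asyncio import run

from redis.asyncio import Redis
from redis.exceptions import ResponseError

async def main() -> None:
    redis = Redis()
    stream, group, consumer = "demo:jobs", "engines", "engine-1"
    try:
        await redis.xgroup_create(stream, group, id="0", mkstream=True)
    except ResponseError as e:
        if "BUSYGROUP" not in str(e):  # the group already existing is fine
            raise
    await redis.xadd(stream, {"job_id": "42"})

    # 1) Adopt messages stuck in another consumer's pending list for over 60s.
    claim = await redis.xautoclaim(stream, group, consumer,
                                   min_idle_time=60_000, start_id="0-0", count=1)
    if claim and claim[1]:
        print("reclaimed:", claim[1][0])

    # 2) Otherwise read the next new message, blocking for up to one second.
    read = await redis.xreadgroup(group, consumer, {stream: ">"}, count=1, block=1000)
    if read:
        msg_id, data = read[0][1][0]
        print("got job", data[b"job_id"].decode())
        await redis.xack(stream, group, msg_id)  # acknowledge after processing
    await redis.aclose()

run(main())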
@@ -367,144 +348,96 @@ class RedisStorage(StorageBackend):
             return results[0]
 
     async def save_client_config(self, token: str, config: dict[str, Any]) -> None:
-
-
-        key = f"orchestrator:client_config:{token}"
-        str_config = {k: self._pack(v) for k, v in config.items()}
-        await self._redis.hset(key, mapping=str_config)
+        await self._redis.hset(
+            f"orchestrator:client_config:{token}", mapping={k: self._pack(v) for k, v in config.items()}
+        )
 
     async def get_client_config(self, token: str) -> dict[str, Any] | None:
-
-        key = f"orchestrator:client_config:{token}"
-        config_raw = await self._redis.hgetall(key)  # type: ignore[misc]
-        if not config_raw:
+        raw = await self._redis.hgetall(f"orchestrator:client_config:{token}")  # type: ignore
+        if not raw:
             return None
-
-        return {k.decode("utf-8"): self._unpack(v) for k, v in config_raw.items()}
+        return {k.decode("utf-8"): self._unpack(v) for k, v in raw.items()}
 
     async def initialize_client_quota(self, token: str, quota: int) -> None:
-        ""
-        key = f"orchestrator:quota:{token}"
-        await self._redis.set(key, quota)
+        await self._redis.set(f"orchestrator:quota:{token}", quota)
 
     async def check_and_decrement_quota(self, token: str) -> bool:
-        """Atomically checks and decrements the quota. Returns True if successful."""
         key = f"orchestrator:quota:{token}"
-
-        LUA_SCRIPT = """
-        local current = redis.call('GET', KEYS[1])
-        if current and tonumber(current) > 0 then
-            redis.call('DECR', KEYS[1])
-            return 1
-        else
-            return 0
-        end
-        """
-
+        LUA = (
+            "local c = redis.call('GET', KEYS[1]) "
+            "if c and tonumber(c) > 0 then redis.call('DECR', KEYS[1]) return 1 else return 0 end"
+        )
         try:
-
-
-            sha = await self._redis.script_load(LUA_SCRIPT)
-            result = await self._redis.evalsha(sha, 1, key)
+            sha = await self._redis.script_load(LUA)
+            res = await self._redis.evalsha(sha, 1, key)
         except NoScriptError:
-
-            # We can then fall back to executing the full script.
-            result = await self._redis.eval(LUA_SCRIPT, 1, key)
+            res = await self._redis.eval(LUA, 1, key)
         except ResponseError as e:
-            # This is the fallback path for `fakeredis` used in tests, which
-            # does not support `SCRIPT LOAD` or `EVALSHA`. It raises a
-            # ResponseError: "unknown command `script`".
             if "unknown command" in str(e):
-
-
-                current_val = await self._redis.get(key)
-                if current_val and int(current_val) > 0:
+                cur = await self._redis.get(key)
+                if cur and int(cur) > 0:
                     await self._redis.decr(key)
                     return True
                 return False
-            # If it's a different ResponseError, re-raise it.
             raise
-
-        return bool(result)
+        return bool(res)
 
     async def flush_all(self):
-        """Completely clears the current Redis database.
-        WARNING: This operation will delete ALL keys in the current DB.
-        Use for testing purposes only.
-        """
-        logger.warning("Flushing all data from Redis database.")
         await self._redis.flushdb()
 
     async def get_job_queue_length(self) -> int:
-        """Returns the length of the job stream."""
         return await self._redis.xlen(self._stream_key)
 
     async def get_active_worker_count(self) -> int:
-
-        count = 0
+        c = 0
         async for _ in self._redis.scan_iter("orchestrator:worker:info:*"):
-            count += 1
-        return count
+            c += 1
+        return c
 
     async def set_nx_ttl(self, key: str, value: str, ttl: int) -> bool:
-
-        Uses Redis SET command with NX (Not Exists) and EX (Expire) options.
-        """
-        # redis.set returns True if set, None if not set (when nx=True)
-        result = await self._redis.set(key, value, nx=True, ex=ttl)
-        return bool(result)
+        return bool(await self._redis.set(key, value, nx=True, ex=ttl))
 
     async def get_str(self, key: str) -> str | None:
         val = await self._redis.get(key)
-        if val is None:
-            return None
-        return val.decode("utf-8") if isinstance(val, bytes) else str(val)
+        return val.decode("utf-8") if isinstance(val, bytes) else str(val) if val is not None else None
 
     async def set_str(self, key: str, value: str, ttl: int | None = None) -> None:
         await self._redis.set(key, value, ex=ttl)
 
     async def set_worker_token(self, worker_id: str, token: str):
-        ""
-        key = f"orchestrator:worker:token:{worker_id}"
-        await self._redis.set(key, token)
+        await self._redis.set(f"orchestrator:worker:token:{worker_id}", token)
 
     async def get_worker_token(self, worker_id: str) -> str | None:
-
-        key = f"orchestrator:worker:token:{worker_id}"
-        token = await self._redis.get(key)
+        token = await self._redis.get(f"orchestrator:worker:token:{worker_id}")
         return token.decode("utf-8") if token else None
 
-    async def get_worker_info(self, worker_id: str) -> dict[str, Any] | None:
-        """Gets the full info for a worker by its ID."""
-        key = f"orchestrator:worker:info:{worker_id}"
-        data = await self._redis.get(key)
-        return self._unpack(data) if data else None
-
     async def acquire_lock(self, key: str, holder_id: str, ttl: int) -> bool:
-
-        redis_key = f"orchestrator:lock:{key}"
-        result = await self._redis.set(redis_key, holder_id, nx=True, ex=ttl)
-        return bool(result)
+        return bool(await self._redis.set(f"orchestrator:lock:{key}", holder_id, nx=True, ex=ttl))
 
     async def release_lock(self, key: str, holder_id: str) -> bool:
-        "
-        redis_key = f"orchestrator:lock:{key}"
-
-        LUA_RELEASE_SCRIPT = """
-        if redis.call("get", KEYS[1]) == ARGV[1] then
-            return redis.call("del", KEYS[1])
-        else
-            return 0
-        end
-        """
+        LUA = "if redis.call('get', KEYS[1]) == ARGV[1] then return redis.call('del', KEYS[1]) else return 0 end"
         try:
-            result = await self._redis.eval(LUA_RELEASE_SCRIPT, 1, redis_key, holder_id)
-            return bool(result)
+            return bool(await self._redis.eval(LUA, 1, f"orchestrator:lock:{key}", holder_id))
         except ResponseError as e:
             if "unknown command" in str(e):
-                current_holder = await self._redis.get(redis_key)
-                if current_holder and current_holder.decode("utf-8") == holder_id:
-                    await self._redis.delete(redis_key)
+                cur = await self._redis.get(f"orchestrator:lock:{key}")
+                if cur and cur.decode("utf-8") == holder_id:
+                    await self._redis.delete(f"orchestrator:lock:{key}")
                     return True
                 return False
             raise e
+
+    async def ping(self) -> bool:
+        try:
+            return await self._redis.ping()
+        except Exception:
+            return False
+
+    async def reindex_workers(self) -> None:
+        """Scan existing worker keys and rebuild indexes."""
+        async for key in self._redis.scan_iter("orchestrator:worker:info:*"):  # type: ignore
+            worker_id = key.decode("utf-8").split(":")[-1]
+            raw = await self._redis.get(key)
+            if raw:
+                info = self._unpack(raw)
+                await self.register_worker(worker_id, info, int(await self._redis.ttl(key)))
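Both inlined Lua scripts exist to make a read-check-write sequence atomic on the server. The release script is the standard safe-release idiom: delete the lock only if the stored value still matches the holder, so one client can never free another client's lock. A runnable sketch using the same script, assuming redis.asyncio:

from asyncio import run

from redis.asyncio import Redis

RELEASE = "if redis.call('get', KEYS[1]) == ARGV[1] then return redis.call('del', KEYS[1]) else return 0 end"

async def main() -> None:
    redis = Redis()
    await redis.set("orchestrator:lock:demo", "holder-a", nx=True, ex=30)
    # A different holder cannot release the lock; the owner can.
    print(bool(await redis.eval(RELEASE, 1, "orchestrator:lock:demo", "holder-b")))  # False
    print(bool(await redis.eval(RELEASE, 1, "orchestrator:lock:demo", "holder-a")))  # True
    await redis.aclose()

run(main())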
avtomatika/utils/webhook_sender.py
CHANGED
@@ -1,4 +1,5 @@
-from asyncio import sleep
+from asyncio import CancelledError, Queue, QueueFull, create_task, sleep
+from contextlib import suppress
 from dataclasses import asdict, dataclass
 from logging import getLogger
 from typing import Any
@@ -22,8 +23,49 @@ class WebhookSender:
         self.session = session
         self.timeout = ClientTimeout(total=10)
         self.max_retries = 3
+        self._queue: Queue[tuple[str, WebhookPayload]] = Queue(maxsize=1000)
+        self._worker_task = None
 
-    async def send(self, url: str, payload: WebhookPayload) -> bool:
+    def start(self) -> None:
+        if not self._worker_task:
+            self._worker_task = create_task(self._worker())
+            logger.info("WebhookSender background worker started.")
+
+    async def stop(self) -> None:
+        if self._worker_task:
+            self._worker_task.cancel()
+            with suppress(CancelledError):
+                await self._worker_task
+            self._worker_task = None
+            logger.info("WebhookSender background worker stopped.")
+
+    async def send(self, url: str, payload: WebhookPayload) -> None:
+        """
+        Queues a webhook to be sent. Non-blocking.
+        Drops the message if the queue is full to prevent backpressure.
+        """
+        try:
+            self._queue.put_nowait((url, payload))
+        except QueueFull:
+            logger.error(
+                f"Webhook queue is full! Dropping webhook for job {payload.job_id} to {url}. "
+                "Consider increasing queue size or checking external service latency."
+            )
+
+    async def _worker(self) -> None:
+        while True:
+            try:
+                url, payload = await self._queue.get()
+                try:
+                    await self._send_single(url, payload)
+                except Exception as e:
+                    logger.exception(f"Unexpected error in webhook worker: {e}")
+                finally:
+                    self._queue.task_done()
+            except CancelledError:
+                break
+
+    async def _send_single(self, url: str, payload: WebhookPayload) -> bool:
         """
         Sends a webhook payload to the specified URL with retries.
         Returns True if successful, False otherwise.
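The sender is now fire-and-forget: send() only enqueues, one background task drains the queue through _send_single, and a full queue drops the payload instead of blocking the caller. Hypothetical usage based only on the methods visible in this diff; the constructor signature and WebhookPayload fields are assumptions:

from asyncio import run

from aiohttp import ClientSession

from avtomatika.utils.webhook_sender import WebhookPayload, WebhookSender

async def main() -> None:
    async with ClientSession() as session:
        sender = WebhookSender(session)         # assumed constructor signature
        sender.start()                          # spawn the drain task once at startup
        payload = WebhookPayload(job_id="42")   # hypothetical field set
        await sender.send("https://example.com/hook", payload)  # returns immediately
        await sender._queue.join()              # demo only: wait for the queue to drain
        await sender.stop()                     # cancel the drain task on shutdown

run(main())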
|