PyPI - puda-comms - Versions diffs - 0.0.4__py3-none-any.whl → 0.0.5__py3-none-any.whl - Mend

puda-comms 0.0.4-py3-none-any.whl → 0.0.5-py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8)

puda_comms/command_service.py +202 -67
puda_comms/machine_client.py +134 -82
puda_comms/models.py +3 -0
puda_comms/run_manager.py +112 -0
{puda_comms-0.0.4.dist-info → puda_comms-0.0.5.dist-info}/METADATA +1 -1
puda_comms-0.0.5.dist-info/RECORD +9 -0
puda_comms-0.0.4.dist-info/RECORD +0 -8
{puda_comms-0.0.4.dist-info → puda_comms-0.0.5.dist-info}/WHEEL +0 -0

puda_comms/command_service.py CHANGED Viewed

@@ -16,7 +16,13 @@ from typing import Dict, Any, Optional
 import nats
 from nats.js.client import JetStreamContext
 from nats.aio.msg import Msg
-from puda_comms.models import CommandRequest, CommandResponseStatus, NATSMessage, MessageHeader, MessageType
+from puda_comms.models import (
+    CommandRequest,
+    CommandResponseStatus,
+    NATSMessage,
+    MessageHeader,
+    MessageType,
+)
 logger = logging.getLogger(__name__)
@@ -266,9 +272,9 @@ class CommandService:
         max_attempts = 3
         connect_timeout = 3  # 3 seconds timeout per connection attempt
-        for attempt in range(1, max_attempts + 1):
+        for attempt in range(max_attempts):
             try:
-                logger.info("Connection attempt %d/%d to NATS servers: %s", attempt, max_attempts, self.servers)
+                logger.info("Connection attempt %d/%d to NATS servers: %s", attempt + 1, max_attempts, self.servers)
                 self.nc = await asyncio.wait_for(
                     nats.connect(
                         servers=self.servers,
@@ -285,14 +291,14 @@ class CommandService:
                 return True
             except asyncio.TimeoutError:
-                logger.warning("Connection attempt %d/%d timed out after %d seconds", attempt, max_attempts, connect_timeout)
-                if attempt < max_attempts:
+                logger.warning("Connection attempt %d/%d timed out after %d seconds", attempt + 1, max_attempts, connect_timeout)
+                if attempt < max_attempts - 1:
                     logger.info("Retrying connection...")
                 else:
                     logger.error("Failed to connect after %d attempts. Giving up.", max_attempts)
             except Exception as e:
-                logger.warning("Connection attempt %d/%d failed: %s", attempt, max_attempts, e)
-                if attempt < max_attempts:
+                logger.warning("Connection attempt %d/%d failed: %s", attempt + 1, max_attempts, e)
+                if attempt < max_attempts - 1:
                     logger.info("Retrying connection...")
                 else:
                     logger.error("Failed to connect after %d attempts. Giving up.", max_attempts)
@@ -408,6 +414,76 @@ class CommandService:
             response_handler.remove_pending(run_id, request.step_number)
             return None
+    async def start_run(
+        self,
+        machine_id: str,
+        run_id: str,
+        user_id: str,
+        username: str,
+        timeout: int = 120
+    ) -> Optional[NATSMessage]:
+        """
+        Send START immediate command to begin a run.
+        Args:
+            machine_id: Machine ID to send the command to
+            run_id: Run ID for the command
+            user_id: User ID who initiated the command
+            username: Username who initiated the command
+            timeout: Maximum time to wait for response in seconds
+        Returns:
+            NATSMessage if successful, None if failed or timeout
+        """
+        request = CommandRequest(
+            name="start",
+            params={},
+            step_number=0
+        )
+        return await self.send_immediate_command(
+            request=request,
+            machine_id=machine_id,
+            run_id=run_id,
+            user_id=user_id,
+            username=username,
+            timeout=timeout
+        )
+    async def complete_run(
+        self,
+        machine_id: str,
+        run_id: str,
+        user_id: str,
+        username: str,
+        timeout: int = 120
+    ) -> Optional[NATSMessage]:
+        """
+        Send COMPLETE immediate command to end a run.
+        Args:
+            machine_id: Machine ID to send the command to
+            run_id: Run ID for the command
+            user_id: User ID who initiated the command
+            username: Username who initiated the command
+            timeout: Maximum time to wait for response in seconds
+        Returns:
+            NATSMessage if successful, None if failed or timeout
+        """
+        request = CommandRequest(
+            name="complete",
+            params={},
+            step_number=0
+        )
+        return await self.send_immediate_command(
+            request=request,
+            machine_id=machine_id,
+            run_id=run_id,
+            user_id=user_id,
+            username=username,
+            timeout=timeout
+        )
     async def send_queue_commands(
         self,
         *,
@@ -421,9 +497,10 @@ class CommandService:
         """
         Send multiple queue commands sequentially and wait for responses.
-        Sends commands one by one, waiting for each response before sending the next.
-        If any command fails or times out, stops immediately and returns the error response.
-        If all commands succeed, returns the last command's response.
+        Automatically sends START command before the sequence and COMPLETE command after
+        successful completion. Sends commands one by one, waiting for each response before
+        sending the next. If any command fails or times out, stops immediately and returns
+        the error response. If all commands succeed, returns the last command's response.
         Args:
             requests: List of CommandRequest models to send sequentially
@@ -451,76 +528,131 @@ class CommandService:
             run_id
         )
+        # Always send START command before sequence
+        logger.info("Sending START command before sequence")
+        start_response = await self.start_run(
+            machine_id=machine_id,
+            run_id=run_id,
+            user_id=user_id,
+            username=username,
+            timeout=timeout
+        )
+        if start_response is None:
+            logger.error("START command timed out")
+            return None
+        if start_response.response and start_response.response.status == CommandResponseStatus.ERROR:
+            logger.error("START command failed: %s", start_response.response.message)
+            return start_response
         last_response: Optional[NATSMessage] = None
-        for idx, request in enumerate(requests, start=1):
-            logger.info(
-                "Sending command %d/%d: %s (step %s)",
-                idx,
-                len(requests),
-                request.name,
-                request.step_number
-            )
-            response = await self.send_queue_command(
-                request=request,
-                machine_id=machine_id,
-                run_id=run_id,
-                user_id=user_id,
-                username=username,
-                timeout=timeout
-            )
-            # Check if command failed (None means timeout or exception)
-            if response is None:
-                logger.error(
-                    "Command %d/%d failed or timed out: %s (step %s)",
+        try:
+            for idx, request in enumerate(requests, start=1):
+                # Validate request - convert dict to CommandRequest if needed
+                if isinstance(request, dict):
+                    request = CommandRequest.model_validate(request)
+                elif not isinstance(request, CommandRequest):
+                    raise ValueError(f"Request {idx} must be a CommandRequest or dict, got {type(request)}")
+                logger.info(
+                    "Sending command %d/%d: %s (step %s)",
                     idx,
                     len(requests),
                     request.name,
                     request.step_number
                 )
-                return None
-            # Check if command returned an error status
-            if response.response is not None:
-                if response.response.status == CommandResponseStatus.ERROR:
+                response = await self.send_queue_command(
+                    request=request,
+                    machine_id=machine_id,
+                    run_id=run_id,
+                    user_id=user_id,
+                    username=username,
+                    timeout=timeout
+                )
+                # Check if command failed (None means timeout or exception)
+                if response is None:
                     logger.error(
-                        "Command %d/%d failed with error: %s (step %s) - code: %s, message: %s",
+                        "Command %d/%d failed or timed out: %s (step %s)",
+                        idx,
+                        len(requests),
+                        request.name,
+                        request.step_number
+                    )
+                    return None
+                # Check if command returned an error status
+                if response.response is not None:
+                    if response.response.status == CommandResponseStatus.ERROR:
+                        logger.error(
+                            "Command %d/%d failed with error: %s (step %s) - code: %s, message: %s",
+                            idx,
+                            len(requests),
+                            request.name,
+                            request.step_number,
+                            response.response.code,
+                            response.response.message
+                        )
+                        return response
+                    # Command succeeded, store as last response
+                    last_response = response
+                    logger.info(
+                        "Command %d/%d succeeded: %s (step %s)",
+                        idx,
+                        len(requests),
+                        request.name,
+                        request.step_number
+                    )
+                else:
+                    # Response exists but has no response data (shouldn't happen, but handle it)
+                    logger.warning(
+                        "Command %d/%d returned response with no response data: %s (step %s)",
                         idx,
                         len(requests),
                         request.name,
-                        request.step_number,
-                        response.response.code,
-                        response.response.message
+                        request.step_number
                     )
                     return response
-                # Command succeeded, store as last response
-                last_response = response
-                logger.info(
-                    "Command %d/%d succeeded: %s (step %s)",
-                    idx,
-                    len(requests),
-                    request.name,
-                    request.step_number
-                )
-            else:
-                # Response exists but has no response data (shouldn't happen, but handle it)
-                logger.warning(
-                    "Command %d/%d returned response with no response data: %s (step %s)",
-                    idx,
-                    len(requests),
-                    request.name,
-                    request.step_number
+            logger.info(
+                "All %d commands completed successfully",
+                len(requests)
+            )
+            # Always send COMPLETE command after successful sequence
+            logger.info("Sending COMPLETE command after successful sequence")
+            complete_response = await self.complete_run(
+                machine_id=machine_id,
+                run_id=run_id,
+                user_id=user_id,
+                username=username,
+                timeout=timeout
+            )
+            if complete_response is None:
+                logger.error("COMPLETE command timed out")
+                return None
+            if complete_response.response and complete_response.response.status == CommandResponseStatus.ERROR:
+                logger.error("COMPLETE command failed: %s", complete_response.response.message)
+                return complete_response
+            # Return the last command response, not the COMPLETE response
+            return last_response
+        except Exception as e:
+            # If any error occurs during command execution, try to complete the run
+            # to clean up state (but don't fail if this also fails)
+            logger.warning("Error during command sequence, attempting to complete run: %s", e)
+            try:
+                await self.complete_run(
+                    machine_id=machine_id,
+                    run_id=run_id,
+                    user_id=user_id,
+                    username=username,
+                    timeout=timeout
                 )
-                return response
-        logger.info(
-            "All %d commands completed successfully",
-            len(requests)
-        )
-        return last_response
+            except Exception as cleanup_error:
+                logger.error("Failed to complete run during error cleanup: %s", cleanup_error)
+            raise
     async def send_immediate_command(
         self,
@@ -651,13 +783,16 @@ class CommandService:
         Args:
             command_request: CommandRequest model containing command details
             machine_id: Machine ID for the command
-            run_id: Run ID for the command
+            run_id: Run ID for the command (empty string will be converted to None)
             user_id: User ID who initiated the command
             username: Username who initiated the command
         Returns:
             NATSMessage object ready for NATS transmission
         """
+        # Convert empty string to None for run_id
+        run_id_value = run_id if run_id else None
         header = MessageHeader(
             message_type=MessageType.COMMAND,
             version="1.0",
@@ -665,7 +800,7 @@ class CommandService:
             user_id=user_id,
             username=username,
             machine_id=machine_id,
-            run_id=run_id
+            run_id=run_id_value
         )
         return NATSMessage(

puda_comms/machine_client.py CHANGED Viewed

@@ -19,6 +19,7 @@ from puda_comms.models import (
     MessageType,
     ImmediateCommand,
 )
+from puda_comms.run_manager import RunManager
 from nats.js.client import JetStreamContext
 from nats.js.api import StreamConfig, ConsumerConfig
 from nats.js.errors import NotFoundError
@@ -80,7 +81,9 @@ class MachineClient:
         # Queue control state
         self._pause_lock = asyncio.Lock()
         self._is_paused = False
-        self._cancelled_run_ids = set()
+        # Run state management
+        self.run_manager = RunManager(machine_id=machine_id)
     def _init_subjects(self):
         """Initialize all subject and stream names."""
@@ -423,7 +426,7 @@ class MachineClient:
             logger.error("Error publishing command response: %s", e)
     async def process_queue_cmd(
-        self,
+        self,
         msg: Msg,
         handler: Callable[[NATSMessage], Awaitable[CommandResponse]]
     ) -> None:
@@ -432,32 +435,26 @@ class MachineClient:
         Args:
             msg: NATS message
-            handler: Handler function that processes the message and returns CommandResponse
+            handler: Handler function that processes the message and returns a CommandResponse object
         """
+        # Initialize variables for exception handlers
+        run_id = None
+        step_number = None
+        command = None
         try:
             # Parse message
             message = NATSMessage.model_validate_json(msg.data)
             run_id = message.header.run_id
-            step_number = message.command.step_number
-            command = message.command.name
+            step_number = message.command.step_number if message.command else None
+            command = message.command.name if message.command else None
-            # Check if cancelled
-            if run_id and run_id in self._cancelled_run_ids:
-                logger.info("Skipping cancelled command: run_id=%s, step_number=%s, command=%s", run_id, step_number, command)
-                await msg.ack()
-                await self._publish_command_response(
-                    msg=msg,
-                    response=CommandResponse(
-                        status=CommandResponseStatus.ERROR,
-                        code=CommandResponseCode.COMMAND_CANCELLED,
-                        message='Command cancelled'
-                    ),
-                    subject=self.response_queue
-                )
-                # Note: Final state update should be published by the handler with machine-specific data
-                return
+            # For all commands, continue with normal processing:
+            # 1. Check if paused
+            # 2. Validate run_id matches active run
+            # 3. Execute handler
-            # Check if paused (for queue messages)
+            # If machine is paused, publish error response and return
             async with self._pause_lock:
                 if self._is_paused:
                     await self._publish_command_response(
@@ -470,24 +467,42 @@ class MachineClient:
                         subject=self.response_queue
                     )
                     return
-                while self._is_paused:
-                    await msg.in_progress()
-                    await asyncio.sleep(1)
-                    # Re-check cancelled state in case it was cancelled while paused
-                    if run_id and run_id in self._cancelled_run_ids:
-                        logger.info("Command cancelled while paused: run_id=%s, step_number=%s, command=%s", run_id, step_number, command)
-                        await msg.ack()
-                        await self._publish_command_response(
-                            msg=msg,
-                            response=CommandResponse(
-                                status=CommandResponseStatus.ERROR,
-                                code=CommandResponseCode.COMMAND_CANCELLED,
-                                message='Command cancelled'
-                            ),
-                            subject=self.response_queue
-                        )
-                        # Note: Final state update should be published by the handler with machine-specific data
-                        return
+            # Wait while paused (release lock during wait so RESUME can acquire it)
+            while True:
+                async with self._pause_lock:
+                    if not self._is_paused:
+                        break
+                # Release lock before sleeping so RESUME can set _is_paused = False
+                await msg.in_progress()
+                await asyncio.sleep(1)
+            # Validate run_id matches active run (run_id is required)
+            if run_id is None:
+                await msg.ack()
+                await self._publish_command_response(
+                    msg=msg,
+                    response=CommandResponse(
+                        status=CommandResponseStatus.ERROR,
+                        code=CommandResponseCode.EXECUTION_ERROR,
+                        message='Command requires run_id'
+                    ),
+                    subject=self.response_queue
+                )
+                return
+            if not await self.run_manager.validate_run_id(run_id):
+                await msg.ack()
+                await self._publish_command_response(
+                    msg=msg,
+                    response=CommandResponse(
+                        status=CommandResponseStatus.ERROR,
+                        code=CommandResponseCode.RUN_ID_MISMATCH,
+                        message=f'Run ID mismatch: expected active run, got {run_id}'
+                    ),
+                    subject=self.response_queue
+                )
+                return
             # Execute handler with auto-heartbeat (task might take a while for machine to complete)
             # The handler should be defined in the machine-specific edge module.
@@ -539,34 +554,19 @@ class MachineClient:
             # This is a rare case - consider if handler should be called with None payload
         except Exception as e:
-            # Check if cancelled before sending error response
-            if run_id and run_id in self._cancelled_run_ids:
-                logger.info("Command cancelled during execution (exception occurred): run_id=%s, step_number=%s, command=%s", run_id, step_number, command)
-                await msg.ack()
-                await self._publish_command_response(
-                    msg=msg,
-                    response=CommandResponse(
-                        status=CommandResponseStatus.ERROR,
-                        code=CommandResponseCode.COMMAND_CANCELLED,
-                        message='Command cancelled'
-                    ),
-                    subject=self.response_queue
-                )
-                # Note: Final state update should be published by the handler with machine-specific data
-            else:
-                # Terminate all errors to prevent infinite redelivery loops
-                logger.error("Handler failed (terminating message): %s", e)
-                await msg.term()
-                await self._publish_command_response(
-                    msg=msg,
-                    response=CommandResponse(
-                        status=CommandResponseStatus.ERROR,
-                        code=CommandResponseCode.EXECUTION_ERROR,
-                        message=str(e)
-                    ),
-                    subject=self.response_queue
-                )
-                # Note: Final state update should be published by the handler with machine-specific data
+            # Terminate all errors to prevent infinite redelivery loops
+            logger.error("Handler failed (terminating message): %s", e)
+            await msg.term()
+            await self._publish_command_response(
+                msg=msg,
+                response=CommandResponse(
+                    status=CommandResponseStatus.ERROR,
+                    code=CommandResponseCode.EXECUTION_ERROR,
+                    message=str(e)
+                ),
+                subject=self.response_queue
+            )
+            # Note: Final state update should be published by the handler with machine-specific data
     async def process_immediate_cmd(self, msg: Msg, handler: Callable[[CommandRequest], Awaitable[CommandResponse]]) -> None:
         """Process immediate commands (pause, cancel, resume, etc.)."""
@@ -581,8 +581,49 @@ class MachineClient:
                 return
             command_name = message.command.name.lower()
+            run_id = message.header.run_id
+            response: CommandResponse
             match command_name:
+                case ImmediateCommand.START:
+                    if run_id:
+                        success = await self.run_manager.start_run(run_id)
+                        if not success:
+                            # Run already active
+                            response = CommandResponse(
+                                status=CommandResponseStatus.ERROR,
+                                code=CommandResponseCode.RUN_ID_MISMATCH,
+                                message='cannot start, another run is currently running'
+                            )
+                        else:
+                            await self.publish_state({'state': 'active', 'run_id': run_id})
+                            response = CommandResponse(status=CommandResponseStatus.SUCCESS)
+                    else:
+                        response = CommandResponse(
+                            status=CommandResponseStatus.ERROR,
+                            code=CommandResponseCode.MISSING_RUN_ID,
+                            message='START command requires RUN_ID'
+                        )
+                case ImmediateCommand.COMPLETE:
+                    if not run_id:
+                        response = CommandResponse(
+                            status=CommandResponseStatus.ERROR,
+                            code=CommandResponseCode.MISSING_RUN_ID,
+                            message='COMPLETE command requires RUN_ID'
+                        )
+                    else:
+                        success = await self.run_manager.complete_run(run_id)
+                        if success:
+                            await self.publish_state({'state': 'idle', 'run_id': None})
+                            response = CommandResponse(status=CommandResponseStatus.SUCCESS)
+                        else:
+                            response = CommandResponse(
+                                status=CommandResponseStatus.ERROR,
+                                code=CommandResponseCode.RUN_ID_MISMATCH,
+                                message=f'Run {run_id} not active'
+                            )
                 case ImmediateCommand.PAUSE:
                     async with self._pause_lock:
                         if not self._is_paused:
@@ -590,7 +631,7 @@ class MachineClient:
                             logger.info("Queue paused")
                             await self.publish_state({'state': 'paused', 'run_id': message.header.run_id})
                     # Call handler and use its response
-                    response: CommandResponse = await handler(message)
+                    response = await handler(message)
                 case ImmediateCommand.RESUME:
                     async with self._pause_lock:
@@ -599,19 +640,30 @@ class MachineClient:
                             logger.info("Queue resumed")
                             await self.publish_state({'state': 'idle', 'run_id': None})
                     # Call handler and use its response
-                    response: CommandResponse = await handler(message)
+                    response = await handler(message)
                 case ImmediateCommand.CANCEL:
-                    if message.header.run_id:
-                        self._cancelled_run_ids.add(message.header.run_id)
-                        logger.info("Cancelling all commands with run_id: %s", message.header.run_id)
+                    if not run_id:
+                        response = CommandResponse(
+                            status=CommandResponseStatus.ERROR,
+                            code=CommandResponseCode.MISSING_RUN_ID,
+                            message='CANCEL command requires RUN_ID'
+                        )
+                    else:
+                        logger.info("Cancelling all commands with run_id: %s", run_id)
+                        # Clear the active run_id when cancelling (try to complete, but clear anyway)
+                        await self.run_manager.complete_run(run_id)
                         await self.publish_state({'state': 'idle', 'run_id': None})
-                    # Call handler and use its response
-                    response: CommandResponse = await handler(message)
+                        # Call handler and use its response
+                        response = await handler(message)
                 case _:
-                    # For other immediate commands, call the user-provided handler
-                    response: CommandResponse = await handler(message)
+                    # Unknown immediate command
+                    response = CommandResponse(
+                        status=CommandResponseStatus.ERROR,
+                        code=CommandResponseCode.UNKNOWN_COMMAND,
+                        message=f'Unknown immediate command: {command_name}'
+                    )
             await self._publish_command_response(
                 msg=msg,
@@ -702,6 +754,9 @@ class MachineClient:
         if not self.js:
             logger.error("JetStream not available for queue subscription")
             return
+        # Store handler for reconnection
+        self._queue_handler = handler
         # Ensure stream exists before attempting to subscribe
         await self._ensure_all_streams()
@@ -744,12 +799,11 @@ class MachineClient:
                 try:
                     while True:
                         try:
-                            # Fetch messages (batch of 1, timeout 1 second)
+                            # Fetch one message (timeout 1 second)
                             msgs = await self._cmd_queue_sub.fetch(batch=1, timeout=1.0)
                             if msgs:
-                                logger.debug("Pulled %d message(s) from queue", len(msgs))
-                            for msg in msgs:
-                                await self.process_queue_cmd(msg, handler)
+                                logger.debug("Pulled message from queue")
+                                await self.process_queue_cmd(msgs[0], handler)
                         except asyncio.TimeoutError:
                             # Timeout is expected when no messages are available
                             continue
@@ -780,8 +834,6 @@ class MachineClient:
                 logger.error("  Stream verification failed: %s", stream_check_error)
             raise
-        # Store handler for reconnection
-        self._queue_handler = handler
         logger.info("Subscribed to queue commands: %s (durable: cmd_queue_%s, stream: %s, pull consumer)",
                    self.cmd_queue, self.machine_id, self.STREAM_COMMAND_QUEUE)

puda_comms/models.py CHANGED Viewed

@@ -25,6 +25,7 @@ class CommandResponseCode(str, Enum):
     RESUME_ERROR = 'RESUME_ERROR'
     NO_EXECUTION = 'NO_EXECUTION'
     RUN_ID_MISMATCH = 'RUN_ID_MISMATCH'
+    MISSING_RUN_ID = 'MISSING_RUN_ID'
     CANCEL_ERROR = 'CANCEL_ERROR'
     MACHINE_PAUSED = 'MACHINE_PAUSED'
@@ -40,6 +41,8 @@ class MessageType(str, Enum):
 class ImmediateCommand(str, Enum):
     """Command names for immediate commands."""
+    START = 'start'
+    COMPLETE = 'complete'
     PAUSE = 'pause'
     RESUME = 'resume'
     CANCEL = 'cancel'

puda_comms/run_manager.py ADDED Viewed

@@ -0,0 +1,112 @@
+"""
+Run State Management
+Provides coroutine-safe (asyncio) run state tracking and validation for machine commands.
+"""
+import asyncio
+import logging
+from typing import Optional
+logger = logging.getLogger(__name__)
+class RunManager:
+    """
+    Manages run state for a machine.
+    Tracks the active run_id and validates that commands match the active run.
+    Provides coroutine-safe operations for run lifecycle management (state is guarded by an asyncio.Lock, which is not thread-safe).
+    """
+    def __init__(self, machine_id: str):
+        """
+        Initialize RunManager for a machine.
+        Args:
+            machine_id: Machine identifier
+        """
+        self.machine_id = machine_id
+        self._active_run_id: Optional[str] = None
+        self._lock = asyncio.Lock()
+    async def start_run(self, run_id: str) -> bool:
+        """
+        Set active run_id. Returns True if successful, False if run already active.
+        Args:
+            run_id: Run ID to set as active
+        Returns:
+            True if run was started successfully, False if another run is already active
+        """
+        async with self._lock:
+            if self._active_run_id is not None:
+                logger.warning(
+                    "Cannot start run %s: run %s is already active on machine %s",
+                    run_id, self._active_run_id, self.machine_id
+                )
+                return False
+            self._active_run_id = run_id
+            logger.info("Started run %s on machine %s", run_id, self.machine_id)
+            return True
+    async def complete_run(self, run_id: str) -> bool:
+        """
+        Clear run_id if it matches. Returns True if successful.
+        Args:
+            run_id: Run ID to complete
+        Returns:
+            True if run was completed successfully, False if run_id doesn't match active run
+        """
+        async with self._lock:
+            if self._active_run_id != run_id:
+                logger.warning(
+                    "Cannot complete run %s: active run is %s on machine %s",
+                    run_id, self._active_run_id, self.machine_id
+                )
+                return False
+            self._active_run_id = None
+            logger.info("Completed run %s on machine %s", run_id, self.machine_id)
+            return True
+    async def validate_run_id(self, run_id: str) -> bool:
+        """
+        Check if run_id matches active run. Returns True if valid.
+        Args:
+            run_id: Run ID to validate (required)
+        Returns:
+            True if run_id matches active run, False otherwise
+        """
+        async with self._lock:
+            # If no active run, any run_id is invalid
+            if self._active_run_id is None:
+                logger.warning(
+                    "Run ID validation failed: no active run, got %s on machine %s",
+                    run_id, self.machine_id
+                )
+                return False
+            # Run_id must match active run
+            if self._active_run_id != run_id:
+                logger.warning(
+                    "Run ID validation failed: expected %s, got %s on machine %s",
+                    self._active_run_id, run_id, self.machine_id
+                )
+                return False
+            return True
+    def get_active_run_id(self) -> Optional[str]:
+        """
+        Get current active run_id.
+        Returns:
+            Active run_id if one exists, None otherwise
+        """
+        return self._active_run_id

{puda_comms-0.0.4.dist-info → puda_comms-0.0.5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: puda-comms
-Version: 0.0.4
+Version: 0.0.5
 Summary: Communication library for the PUDA platform.
 Author: zhao
 Author-email: zhao <20024592+agentzhao@users.noreply.github.com>

puda_comms-0.0.5.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,9 @@
+puda_comms/__init__.py,sha256=lntvVFJJez_rv5lZy5mYj4_43B9Y3NRNzxWfBuSAQ1M,194
+puda_comms/command_service.py,sha256=Lxk-CUan_DwftBZlSYO3VnddxaM9fYKxxhWF8VCqABY,30423
+puda_comms/execution_state.py,sha256=aTaejCnJgg1y_FP-ymIC1GQzqC81FIWo0RZ18XzAQnA,2881
+puda_comms/machine_client.py,sha256=OnA8we1c62n1aEFr0NfiapklHWXR-WFzq5FXQrvuUM8,39378
+puda_comms/models.py,sha256=CfXq_Wxqk5OQo5VknXR-BdLIT2SM69s8cGxGYr9T8WI,3701
+puda_comms/run_manager.py,sha256=_s4VYVGwtRMcduz95_DPIObso4uWRS24n5NH7AiGgjI,3591
+puda_comms-0.0.5.dist-info/WHEEL,sha256=ZyFSCYkV2BrxH6-HRVRg3R9Fo7MALzer9KiPYqNxSbo,79
+puda_comms-0.0.5.dist-info/METADATA,sha256=REBvcpJsUCxiFCKihVVReP0lh6IkJcBl4I8XohjhSHE,11512
+puda_comms-0.0.5.dist-info/RECORD,,

puda_comms-0.0.4.dist-info/RECORD DELETED Viewed

@@ -1,8 +0,0 @@
-puda_comms/__init__.py,sha256=lntvVFJJez_rv5lZy5mYj4_43B9Y3NRNzxWfBuSAQ1M,194
-puda_comms/command_service.py,sha256=KFremcEGfsTeUVQMIhyk1knYmUCvRYQ12vS_jy_14wA,25193
-puda_comms/execution_state.py,sha256=aTaejCnJgg1y_FP-ymIC1GQzqC81FIWo0RZ18XzAQnA,2881
-puda_comms/machine_client.py,sha256=wj6t_QHGs7l1Oc8JQ6hq2hqBd5C14TCPA_dTU9qOLzw,37430
-puda_comms/models.py,sha256=9ZGX0PR7SgMBOL5zVLrPuSUhZqutQU96PubyjyQLhf8,3617
-puda_comms-0.0.4.dist-info/WHEEL,sha256=ZyFSCYkV2BrxH6-HRVRg3R9Fo7MALzer9KiPYqNxSbo,79
-puda_comms-0.0.4.dist-info/METADATA,sha256=0cMHDub_3NZt7Cj5U1jzrQXI8atQqpMM-i3vSMrT5lo,11512
-puda_comms-0.0.4.dist-info/RECORD,,

{puda_comms-0.0.4.dist-info → puda_comms-0.0.5.dist-info}/WHEEL RENAMED Viewed

File without changes

puda-comms 0.0.4__py3-none-any.whl → 0.0.5__py3-none-any.whl

puda-comms 0.0.4-py3-none-any.whl → 0.0.5-py3-none-any.whl