PyPI - robosystems-client - Versions diffs - 0.1.19__py3-none-any.whl → 0.2.1__py3-none-any.whl - Mend

robosystems-client 0.1.19__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of robosystems-client might be problematic. Click here for more details.

Files changed (141) hide show

robosystems_client/extensions/operation_client.py CHANGED Viewed

@@ -83,7 +83,12 @@ class OperationClient:
   def monitor_operation(
     self, operation_id: str, options: MonitorOptions = None
   ) -> OperationResult:
-    """Monitor a single operation until completion"""
+    """Monitor a single operation until completion
+    The SSE stream will replay all events from the beginning (from_sequence=0),
+    so even if the operation completed before we connected, we'll still receive
+    all events including the completion event.
+    """
     if options is None:
       options = MonitorOptions()
@@ -91,8 +96,9 @@ class OperationClient:
     completed = False
     error = None
-    # Set up SSE connection
-    sse_config = SSEConfig(base_url=self.base_url)
+    # Set up SSE connection with event replay from the beginning
+    # This handles the race condition where the operation may have already completed
+    sse_config = SSEConfig(base_url=self.base_url, headers=self.headers)
     sse_client = SSEClient(sse_config)
     def on_operation_started(data):
@@ -265,6 +271,8 @@ class AsyncOperationClient:
   def __init__(self, config: Dict[str, Any]):
     self.config = config
     self.base_url = config["base_url"]
+    self.headers = config.get("headers", {})
+    self.token = config.get("token")
     self.active_operations: Dict[str, AsyncSSEClient] = {}
   async def monitor_operation(
@@ -279,7 +287,7 @@ class AsyncOperationClient:
     error = None
     # Set up SSE connection
-    sse_config = SSEConfig(base_url=self.base_url)
+    sse_config = SSEConfig(base_url=self.base_url, headers=self.headers)
     sse_client = AsyncSSEClient(sse_config)
     def on_operation_started(data):

robosystems_client/extensions/query_client.py CHANGED Viewed

@@ -98,45 +98,59 @@ class QueryClient:
     )
     # Execute the query through the generated client
-    from ..client import Client
-    # Create client with headers
-    client = Client(base_url=self.base_url, headers=self.headers)
+    from ..client import AuthenticatedClient
+    # Create authenticated client with X-API-Key
+    if not self.token:
+      raise Exception("No API key provided. Set X-API-Key in headers.")
+    client = AuthenticatedClient(
+      base_url=self.base_url,
+      token=self.token,
+      prefix="",
+      auth_header_name="X-API-Key",
+      headers=self.headers,
+    )
     try:
       kwargs = {"graph_id": graph_id, "client": client, "body": query_request}
-      # Only add token if it's a valid string
-      if self.token and isinstance(self.token, str) and self.token.strip():
-        kwargs["token"] = self.token
       response = execute_cypher_query(**kwargs)
       # Check response type and handle accordingly
       if hasattr(response, "parsed") and response.parsed:
         response_data = response.parsed
+        # Handle both dict and object responses
+        if isinstance(response_data, dict):
+          # Response is a plain dict
+          data = response_data
+        else:
+          # Response is an object with additional_properties
+          data = (
+            response_data.additional_properties
+            if hasattr(response_data, "additional_properties")
+            else response_data
+          )
         # Check if this is an immediate response
-        if hasattr(response_data, "data") and hasattr(response_data, "columns"):
+        if "data" in data and "columns" in data:
           return QueryResult(
-            data=response_data.data,
-            columns=response_data.columns,
-            row_count=getattr(response_data, "row_count", len(response_data.data)),
-            execution_time_ms=getattr(response_data, "execution_time_ms", 0),
+            data=data["data"],
+            columns=data["columns"],
+            row_count=data.get("row_count", len(data["data"])),
+            execution_time_ms=data.get("execution_time_ms", 0),
             graph_id=graph_id,
-            timestamp=getattr(response_data, "timestamp", datetime.now().isoformat()),
+            timestamp=data.get("timestamp", datetime.now().isoformat()),
           )
         # Check if this is a queued response
-        if (
-          hasattr(response_data, "status")
-          and response_data.status == "queued"
-          and hasattr(response_data, "operation_id")
-        ):
+        if data.get("status") == "queued" and "operation_id" in data:
           queued_response = QueuedQueryResponse(
-            status=response_data.status,
-            operation_id=response_data.operation_id,
-            queue_position=getattr(response_data, "queue_position", 0),
-            estimated_wait_seconds=getattr(response_data, "estimated_wait_seconds", 0),
-            message=getattr(response_data, "message", "Query queued"),
+            status=data["status"],
+            operation_id=data["operation_id"],
+            queue_position=data.get("queue_position", 0),
+            estimated_wait_seconds=data.get("estimated_wait_seconds", 0),
+            message=data.get("message", "Query queued"),
           )
           # Notify about queue status
@@ -182,7 +196,7 @@ class QueryClient:
     error = None
     # Set up SSE connection
-    sse_config = SSEConfig(base_url=self.base_url)
+    sse_config = SSEConfig(base_url=self.base_url, headers=self.headers)
     self.sse_client = SSEClient(sse_config)
     # Set up event handlers

robosystems_client/extensions/sse_client.py CHANGED Viewed

@@ -124,9 +124,11 @@ class SSEClient:
     try:
       event_buffer = {"event": None, "data": [], "id": None, "retry": None}
+      print("[SSE DEBUG] Starting to process events...")
       for line in self._response.iter_lines():
         if self.closed:
+          print("[SSE DEBUG] Stream closed, breaking out of loop")
           break
         line = line.strip()
@@ -134,6 +136,7 @@ class SSEClient:
         # Empty line indicates end of event
         if not line:
           if event_buffer["data"] or event_buffer["event"]:
+            print(f"[SSE DEBUG] Dispatching event: {event_buffer.get('event')}")
             self._dispatch_event(event_buffer)
           event_buffer = {"event": None, "data": [], "id": None, "retry": None}
           continue
@@ -169,9 +172,13 @@ class SSEClient:
       # Handle final event if stream ends without empty line
       if event_buffer["data"] or event_buffer["event"]:
+        print("[SSE DEBUG] Dispatching final event after stream end")
         self._dispatch_event(event_buffer)
+      print("[SSE DEBUG] Event processing loop ended")
     except Exception as error:
+      print(f"[SSE DEBUG] Exception in event processing: {error}")
       if not self.closed:
         self.emit("error", error)
@@ -394,9 +401,13 @@ class AsyncSSEClient:
       # Handle final event if stream ends without empty line
       if event_buffer["data"] or event_buffer["event"]:
+        print("[SSE DEBUG] Dispatching final event after stream end")
         self._dispatch_event(event_buffer)
+      print("[SSE DEBUG] Event processing loop ended")
     except Exception as error:
+      print(f"[SSE DEBUG] Exception in event processing: {error}")
       if not self.closed:
         self.emit("error", error)

robosystems_client/extensions/table_ingest_client.py ADDED Viewed

@@ -0,0 +1,466 @@
+"""Table Ingest Client for RoboSystems API
+Simplifies uploading Parquet files to staging tables and ingesting them into graphs.
+"""
+from dataclasses import dataclass
+from io import BytesIO
+from pathlib import Path
+from typing import Dict, Any, Optional, Callable, List, Union, BinaryIO
+import json
+import logging
+import httpx
+from ..api.tables.get_upload_url_v1_graphs_graph_id_tables_table_name_files_post import (
+  sync_detailed as get_upload_url,
+)
+from ..api.tables.update_file_v1_graphs_graph_id_tables_files_file_id_patch import (
+  sync_detailed as update_file,
+)
+from ..api.tables.list_tables_v1_graphs_graph_id_tables_get import (
+  sync_detailed as list_tables,
+)
+from ..api.tables.ingest_tables_v1_graphs_graph_id_tables_ingest_post import (
+  sync_detailed as ingest_tables,
+)
+from ..models.file_upload_request import FileUploadRequest
+from ..models.file_update_request import FileUpdateRequest
+from ..models.bulk_ingest_request import BulkIngestRequest
+logger = logging.getLogger(__name__)
+@dataclass
+class UploadOptions:
+  """Options for file upload operations"""
+  # Optional callback invoked with a human-readable status string at each
+  # upload step (getting the URL, uploading, updating metadata, done).
+  on_progress: Optional[Callable[[str], None]] = None
+  # When True, "localstack:4566" in the presigned upload URL is rewritten to
+  # "localhost:4566" before the file is uploaded.
+  fix_localstack_url: bool = True  # Auto-fix LocalStack URLs for localhost
+  # Used as the file name for buffer uploads; when unset, buffer uploads are
+  # named "data.parquet". Path uploads use the path's own file name.
+  file_name: Optional[str] = None  # Override file name (useful for buffer uploads)
+@dataclass
+class IngestOptions:
+  """Options for table ingestion operations"""
+  # Forwarded unchanged as BulkIngestRequest.ignore_errors.
+  # NOTE(review): presumably lets ingestion continue past bad rows/files;
+  # confirm against the API documentation.
+  ignore_errors: bool = True
+  # Forwarded unchanged as BulkIngestRequest.rebuild.
+  # NOTE(review): exact server-side semantics are not visible here; confirm.
+  rebuild: bool = False
+  # Optional callback invoked with a status string before and after the
+  # ingest request is sent.
+  on_progress: Optional[Callable[[str], None]] = None
+@dataclass
+class UploadResult:
+  """Result from file upload operation"""
+  # File identifier returned with the presigned upload URL; "" when the upload
+  # failed before or while obtaining/using that URL.
+  file_id: str
+  # Number of bytes uploaded; 0 on early failure.
+  file_size: int
+  # Row count reported to the API (read via pyarrow, or estimated from the
+  # file size when pyarrow is not installed); 0 on early failure.
+  row_count: int
+  # Staging table the file was uploaded to.
+  table_name: str
+  # Name the file was uploaded under.
+  file_name: str
+  # False when any step of the upload failed; see `error` for the reason.
+  success: bool = True
+  # Human-readable failure description; None on success.
+  error: Optional[str] = None
+@dataclass
+class TableInfo:
+  """Information about a staging table"""
+  # All four fields are copied verbatim from the entries of the list-tables
+  # API response.
+  table_name: str
+  row_count: int
+  file_count: int
+  # NOTE(review): presumably the combined size of the table's files in bytes,
+  # as the name suggests; confirm against the API documentation.
+  total_size_bytes: int
+class TableIngestClient:
+  """Enhanced table ingest client with simplified upload workflow"""
+  def __init__(self, config: Dict[str, Any]):
+    self.config = config
+    self.base_url = config["base_url"]
+    self.headers = config.get("headers", {})
+    self.token = config.get("token")
+    # Create httpx client for S3 uploads
+    self._http_client = httpx.Client(timeout=120.0)
+  def upload_parquet_file(
+    self,
+    graph_id: str,
+    table_name: str,
+    file_or_buffer: Union[Path, str, BytesIO, BinaryIO],
+    options: Optional[UploadOptions] = None,
+  ) -> UploadResult:
+    """
+    Upload a Parquet file to a staging table.
+    This method handles the complete 3-step upload process:
+    1. Get presigned upload URL
+    2. Upload file to S3
+    3. Update file metadata
+    Args:
+        graph_id: The graph ID
+        table_name: Name of the staging table
+        file_or_buffer: Path to the Parquet file or BytesIO/BinaryIO buffer
+        options: Upload options
+    Returns:
+        UploadResult with upload details
+    """
+    if options is None:
+      options = UploadOptions()
+    # Auto-detect if this is a file path or buffer
+    is_buffer = isinstance(file_or_buffer, (BytesIO, BinaryIO)) or hasattr(
+      file_or_buffer, "read"
+    )
+    if is_buffer:
+      # Handle buffer upload
+      file_name = options.file_name or "data.parquet"
+    else:
+      # Handle file path upload
+      file_path = Path(file_or_buffer)
+      file_name = file_path.name
+      if not file_path.exists():
+        return UploadResult(
+          file_id="",
+          file_size=0,
+          row_count=0,
+          table_name=table_name,
+          file_name=file_name,
+          success=False,
+          error=f"File not found: {file_path}",
+        )
+    try:
+      # Import client here to avoid circular imports
+      from ..client import AuthenticatedClient
+      # Create authenticated client with X-API-Key
+      # The token is extracted from X-API-Key header in extensions.py
+      if not self.token:
+        return UploadResult(
+          file_id="",
+          file_size=0,
+          row_count=0,
+          table_name=table_name,
+          file_name=file_name,
+          success=False,
+          error="No API key provided. Set X-API-Key in headers.",
+        )
+      client = AuthenticatedClient(
+        base_url=self.base_url,
+        token=self.token,
+        prefix="",  # No prefix for X-API-Key
+        auth_header_name="X-API-Key",  # Use X-API-Key header instead of Authorization
+        headers=self.headers,
+      )
+      # Step 1: Get presigned upload URL
+      if options.on_progress:
+        options.on_progress(
+          f"Getting upload URL for {file_name} -> table '{table_name}'..."
+        )
+      upload_request = FileUploadRequest(
+        file_name=file_name, content_type="application/x-parquet"
+      )
+      kwargs = {
+        "graph_id": graph_id,
+        "table_name": table_name,
+        "client": client,
+        "body": upload_request,
+      }
+      response = get_upload_url(**kwargs)
+      if not response.parsed:
+        error_msg = f"Failed to get upload URL (status: {response.status_code})"
+        if hasattr(response, "content"):
+          try:
+            error_detail = json.loads(response.content)
+            error_msg = f"{error_msg}: {error_detail}"
+          except (json.JSONDecodeError, ValueError):
+            error_msg = f"{error_msg}: {response.content[:200]}"
+        return UploadResult(
+          file_id="",
+          file_size=0,
+          row_count=0,
+          table_name=table_name,
+          file_name=file_name,
+          success=False,
+          error=error_msg,
+        )
+      upload_url = response.parsed.upload_url
+      file_id = response.parsed.file_id
+      # Fix LocalStack URL if needed
+      if options.fix_localstack_url and "localstack:4566" in upload_url:
+        upload_url = upload_url.replace("localstack:4566", "localhost:4566")
+        logger.debug("Fixed LocalStack URL for localhost access")
+      # Step 2: Upload file to S3
+      if options.on_progress:
+        options.on_progress(f"Uploading {file_name} to S3...")
+      # Read file content - handle both paths and buffers
+      if is_buffer:
+        # Read from buffer
+        if hasattr(file_or_buffer, "getvalue"):
+          file_content = file_or_buffer.getvalue()
+        else:
+          # BinaryIO or file-like object
+          file_or_buffer.seek(0)
+          file_content = file_or_buffer.read()
+        file_size = len(file_content)
+      else:
+        # Read from file path
+        with open(file_path, "rb") as f:
+          file_content = f.read()
+        file_size = len(file_content)
+      s3_response = self._http_client.put(
+        upload_url,
+        content=file_content,
+        headers={"Content-Type": "application/x-parquet"},
+      )
+      s3_response.raise_for_status()
+      # Step 3: Get row count and update file metadata
+      if options.on_progress:
+        options.on_progress(f"Updating file metadata for {file_name}...")
+      try:
+        import pyarrow.parquet as pq
+        if is_buffer:
+          # Read from buffer for row count
+          if hasattr(file_or_buffer, "seek"):
+            file_or_buffer.seek(0)
+          parquet_table = pq.read_table(file_or_buffer)
+        else:
+          # Read from file path
+          parquet_table = pq.read_table(file_path)
+        row_count = parquet_table.num_rows
+      except ImportError:
+        logger.warning(
+          "pyarrow not installed, row count will be estimated from file size"
+        )
+        # Rough estimate: ~100 bytes per row for typical data
+        row_count = file_size // 100
+      metadata_update = FileUpdateRequest(
+        file_size_bytes=file_size, row_count=row_count
+      )
+      kwargs = {
+        "graph_id": graph_id,
+        "file_id": file_id,
+        "client": client,
+        "body": metadata_update,
+      }
+      update_response = update_file(**kwargs)
+      if not update_response.parsed:
+        return UploadResult(
+          file_id=file_id,
+          file_size=file_size,
+          row_count=row_count,
+          table_name=table_name,
+          file_name=file_name,
+          success=False,
+          error="Failed to update file metadata",
+        )
+      if options.on_progress:
+        options.on_progress(
+          f"✅ Uploaded {file_name} ({file_size:,} bytes, {row_count:,} rows)"
+        )
+      return UploadResult(
+        file_id=file_id,
+        file_size=file_size,
+        row_count=row_count,
+        table_name=table_name,
+        file_name=file_name,
+        success=True,
+      )
+    except Exception as e:
+      logger.error(f"Upload failed for {file_name}: {e}")
+      return UploadResult(
+        file_id="",
+        file_size=0,
+        row_count=0,
+        table_name=table_name,
+        file_name=file_name,
+        success=False,
+        error=str(e),
+      )
+  def list_staging_tables(self, graph_id: str) -> List[TableInfo]:
+    """
+    List all staging tables in a graph.
+    Args:
+        graph_id: The graph ID
+    Returns:
+        List of TableInfo objects
+    """
+    try:
+      from ..client import AuthenticatedClient
+      if not self.token:
+        logger.error("No API key provided")
+        return []
+      client = AuthenticatedClient(
+        base_url=self.base_url,
+        token=self.token,
+        prefix="",
+        auth_header_name="X-API-Key",
+        headers=self.headers,
+      )
+      kwargs = {"graph_id": graph_id, "client": client}
+      response = list_tables(**kwargs)
+      if not response.parsed:
+        logger.error("Failed to list tables")
+        return []
+      tables = []
+      for table_data in response.parsed.tables:
+        tables.append(
+          TableInfo(
+            table_name=table_data.table_name,
+            row_count=table_data.row_count,
+            file_count=table_data.file_count,
+            total_size_bytes=table_data.total_size_bytes,
+          )
+        )
+      return tables
+    except Exception as e:
+      logger.error(f"Failed to list tables: {e}")
+      return []
+  def ingest_all_tables(
+    self, graph_id: str, options: Optional[IngestOptions] = None
+  ) -> Dict[str, Any]:
+    """
+    Ingest all staging tables into the graph.
+    Args:
+        graph_id: The graph ID
+        options: Ingest options
+    Returns:
+        Dictionary with ingestion results
+    """
+    if options is None:
+      options = IngestOptions()
+    try:
+      from ..client import AuthenticatedClient
+      if not self.token:
+        return {"success": False, "error": "No API key provided"}
+      client = AuthenticatedClient(
+        base_url=self.base_url,
+        token=self.token,
+        prefix="",
+        auth_header_name="X-API-Key",
+        headers=self.headers,
+      )
+      if options.on_progress:
+        options.on_progress("Starting table ingestion...")
+      ingest_request = BulkIngestRequest(
+        ignore_errors=options.ignore_errors, rebuild=options.rebuild
+      )
+      kwargs = {
+        "graph_id": graph_id,
+        "client": client,
+        "body": ingest_request,
+      }
+      response = ingest_tables(**kwargs)
+      if not response.parsed:
+        return {"success": False, "error": "Failed to ingest tables"}
+      result = {
+        "success": True,
+        "operation_id": getattr(response.parsed, "operation_id", None),
+        "message": getattr(response.parsed, "message", "Ingestion started"),
+      }
+      if options.on_progress:
+        options.on_progress("✅ Table ingestion completed")
+      return result
+    except Exception as e:
+      logger.error(f"Failed to ingest tables: {e}")
+      return {"success": False, "error": str(e)}
+  def upload_and_ingest(
+    self,
+    graph_id: str,
+    table_name: str,
+    file_path: Path,
+    upload_options: Optional[UploadOptions] = None,
+    ingest_options: Optional[IngestOptions] = None,
+  ) -> Dict[str, Any]:
+    """
+    Convenience method to upload a file and immediately ingest it.
+    Args:
+        graph_id: The graph ID
+        table_name: Name of the staging table
+        file_path: Path to the Parquet file
+        upload_options: Upload options
+        ingest_options: Ingest options
+    Returns:
+        Dictionary with upload and ingest results
+    """
+    # Upload the file
+    upload_result = self.upload_parquet_file(
+      graph_id, table_name, file_path, upload_options
+    )
+    if not upload_result.success:
+      return {
+        "success": False,
+        "upload": upload_result,
+        "ingest": None,
+        "error": upload_result.error,
+      }
+    # Ingest the table
+    ingest_result = self.ingest_all_tables(graph_id, ingest_options)
+    return {
+      "success": upload_result.success and ingest_result.get("success", False),
+      "upload": upload_result,
+      "ingest": ingest_result,
+    }
+  def close(self):
+    """Close HTTP client connections"""
+    if self._http_client:
+      self._http_client.close()

robosystems-client 0.1.19__py3-none-any.whl → 0.2.1__py3-none-any.whl

Potentially problematic release.

robosystems-client 0.1.19__py3-none-any.whl → 0.2.1__py3-none-any.whl