remdb 0.3.7__py3-none-any.whl → 0.3.133__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (107)
  1. rem/__init__.py +129 -2
  2. rem/agentic/README.md +76 -0
  3. rem/agentic/__init__.py +15 -0
  4. rem/agentic/agents/__init__.py +16 -2
  5. rem/agentic/agents/sse_simulator.py +502 -0
  6. rem/agentic/context.py +51 -25
  7. rem/agentic/llm_provider_models.py +301 -0
  8. rem/agentic/mcp/tool_wrapper.py +112 -17
  9. rem/agentic/otel/setup.py +93 -4
  10. rem/agentic/providers/phoenix.py +314 -132
  11. rem/agentic/providers/pydantic_ai.py +215 -26
  12. rem/agentic/schema.py +361 -21
  13. rem/agentic/tools/rem_tools.py +3 -3
  14. rem/api/README.md +238 -1
  15. rem/api/deps.py +255 -0
  16. rem/api/main.py +154 -37
  17. rem/api/mcp_router/resources.py +1 -1
  18. rem/api/mcp_router/server.py +26 -5
  19. rem/api/mcp_router/tools.py +465 -7
  20. rem/api/middleware/tracking.py +172 -0
  21. rem/api/routers/admin.py +494 -0
  22. rem/api/routers/auth.py +124 -0
  23. rem/api/routers/chat/completions.py +402 -20
  24. rem/api/routers/chat/models.py +88 -10
  25. rem/api/routers/chat/otel_utils.py +33 -0
  26. rem/api/routers/chat/sse_events.py +542 -0
  27. rem/api/routers/chat/streaming.py +642 -45
  28. rem/api/routers/dev.py +81 -0
  29. rem/api/routers/feedback.py +268 -0
  30. rem/api/routers/messages.py +473 -0
  31. rem/api/routers/models.py +78 -0
  32. rem/api/routers/query.py +360 -0
  33. rem/api/routers/shared_sessions.py +406 -0
  34. rem/auth/middleware.py +126 -27
  35. rem/cli/commands/README.md +237 -64
  36. rem/cli/commands/ask.py +13 -10
  37. rem/cli/commands/cluster.py +1808 -0
  38. rem/cli/commands/configure.py +5 -6
  39. rem/cli/commands/db.py +396 -139
  40. rem/cli/commands/experiments.py +469 -74
  41. rem/cli/commands/process.py +22 -15
  42. rem/cli/commands/scaffold.py +47 -0
  43. rem/cli/commands/schema.py +97 -50
  44. rem/cli/main.py +29 -6
  45. rem/config.py +10 -3
  46. rem/models/core/core_model.py +7 -1
  47. rem/models/core/experiment.py +54 -0
  48. rem/models/core/rem_query.py +5 -2
  49. rem/models/entities/__init__.py +21 -0
  50. rem/models/entities/domain_resource.py +38 -0
  51. rem/models/entities/feedback.py +123 -0
  52. rem/models/entities/message.py +30 -1
  53. rem/models/entities/session.py +83 -0
  54. rem/models/entities/shared_session.py +180 -0
  55. rem/models/entities/user.py +10 -3
  56. rem/registry.py +373 -0
  57. rem/schemas/agents/rem.yaml +7 -3
  58. rem/services/content/providers.py +92 -133
  59. rem/services/content/service.py +92 -20
  60. rem/services/dreaming/affinity_service.py +2 -16
  61. rem/services/dreaming/moment_service.py +2 -15
  62. rem/services/embeddings/api.py +24 -17
  63. rem/services/embeddings/worker.py +16 -16
  64. rem/services/phoenix/EXPERIMENT_DESIGN.md +3 -3
  65. rem/services/phoenix/client.py +302 -28
  66. rem/services/postgres/README.md +159 -15
  67. rem/services/postgres/__init__.py +2 -1
  68. rem/services/postgres/diff_service.py +531 -0
  69. rem/services/postgres/pydantic_to_sqlalchemy.py +427 -129
  70. rem/services/postgres/repository.py +132 -0
  71. rem/services/postgres/schema_generator.py +291 -9
  72. rem/services/postgres/service.py +6 -6
  73. rem/services/rate_limit.py +113 -0
  74. rem/services/rem/README.md +14 -0
  75. rem/services/rem/parser.py +44 -9
  76. rem/services/rem/service.py +36 -2
  77. rem/services/session/compression.py +24 -1
  78. rem/services/session/reload.py +1 -1
  79. rem/services/user_service.py +98 -0
  80. rem/settings.py +399 -29
  81. rem/sql/background_indexes.sql +21 -16
  82. rem/sql/migrations/001_install.sql +387 -54
  83. rem/sql/migrations/002_install_models.sql +2320 -393
  84. rem/sql/migrations/003_optional_extensions.sql +326 -0
  85. rem/sql/migrations/004_cache_system.sql +548 -0
  86. rem/utils/__init__.py +18 -0
  87. rem/utils/constants.py +97 -0
  88. rem/utils/date_utils.py +228 -0
  89. rem/utils/embeddings.py +17 -4
  90. rem/utils/files.py +167 -0
  91. rem/utils/mime_types.py +158 -0
  92. rem/utils/model_helpers.py +156 -1
  93. rem/utils/schema_loader.py +282 -35
  94. rem/utils/sql_paths.py +146 -0
  95. rem/utils/sql_types.py +3 -1
  96. rem/utils/vision.py +9 -14
  97. rem/workers/README.md +14 -14
  98. rem/workers/__init__.py +3 -1
  99. rem/workers/db_listener.py +579 -0
  100. rem/workers/db_maintainer.py +74 -0
  101. rem/workers/unlogged_maintainer.py +463 -0
  102. {remdb-0.3.7.dist-info → remdb-0.3.133.dist-info}/METADATA +460 -303
  103. {remdb-0.3.7.dist-info → remdb-0.3.133.dist-info}/RECORD +105 -74
  104. {remdb-0.3.7.dist-info → remdb-0.3.133.dist-info}/WHEEL +1 -1
  105. rem/sql/002_install_models.sql +0 -1068
  106. rem/sql/install_models.sql +0 -1038
  107. {remdb-0.3.7.dist-info → remdb-0.3.133.dist-info}/entry_points.txt +0 -0
@@ -1,17 +1,43 @@
1
1
  """
2
2
  OpenAI-compatible API models for chat completions.
3
3
 
4
- Design Pattern
4
+ Design Pattern:
5
5
  - Full OpenAI compatibility for drop-in replacement
6
6
  - Support for streaming (SSE) and non-streaming modes
7
7
  - Response format control (text vs json_object)
8
- - Headers map to AgentContext (X-User-Id, X-Tenant-Id, X-Agent-Schema, etc.)
8
+ - Headers map to AgentContext for session/context control
9
+ - Body fields for OpenAI-compatible parameters + metadata
10
+
11
+ Headers (context control):
12
+ X-User-Id → context.user_id (user identifier)
13
+ X-Tenant-Id → context.tenant_id (multi-tenancy, default: "default")
14
+ X-Session-Id → context.session_id (conversation continuity)
15
+ X-Agent-Schema → context.agent_schema_uri (which agent to use, default: "rem")
16
+ X-Model-Name → context.default_model (model override)
17
+ X-Chat-Is-Audio → triggers audio transcription ("true"/"false")
18
+ X-Is-Eval → context.is_eval (marks session as evaluation, sets mode=EVALUATION)
19
+
20
+ Body Fields (OpenAI-compatible + extensions):
21
+ model → LLM model (e.g., "openai:gpt-4.1", "anthropic:claude-sonnet-4-5-20250929")
22
+ messages → Chat conversation history
23
+ temperature → Sampling temperature (0-2)
24
+ max_tokens → Max tokens (deprecated, use max_completion_tokens)
25
+ max_completion_tokens → Max tokens to generate
26
+ stream → Enable SSE streaming
27
+ metadata → Key-value pairs merged with session metadata (for evals/experiments)
28
+ store → Whether to store for distillation/evaluation
29
+ seed → Deterministic sampling seed
30
+ top_p → Nucleus sampling probability
31
+ reasoning_effort → low/medium/high for o-series models
32
+ service_tier → auto/flex/priority/default
9
33
  """
10
34
 
11
- from typing import Literal
35
+ from typing import Any, Literal
12
36
 
13
37
  from pydantic import BaseModel, Field
14
38
 
39
+ from rem.settings import settings
40
+
15
41
 
16
42
  # Request models
17
43
  class ChatMessage(BaseModel):
@@ -44,17 +70,26 @@ class ChatCompletionRequest(BaseModel):
44
70
  Compatible with OpenAI's /v1/chat/completions endpoint.
45
71
 
46
72
  Headers Map to AgentContext:
47
- - X-User-Id → context.user_id
48
- - X-Tenant-Id → context.tenant_id
49
- - X-Session-Id → context.session_id
50
- - X-Agent-Schema → context.agent_schema_uri
73
+ X-User-Id → context.user_id
74
+ X-Tenant-Id → context.tenant_id (default: "default")
75
+ X-Session-Id → context.session_id
76
+ X-Agent-Schema → context.agent_schema_uri (default: "rem")
77
+ X-Model-Name → context.default_model
78
+ X-Chat-Is-Audio → triggers audio transcription
79
+ X-Is-Eval → context.is_eval (sets session mode=EVALUATION)
80
+
81
+ Body Fields for Metadata/Evals:
82
+ metadata → Key-value pairs merged with session metadata
83
+ store → Whether to store for distillation/evaluation
51
84
 
52
85
  Note: Model is specified in body.model (standard OpenAI field), not headers.
53
86
  """
54
87
 
55
- model: str = Field(
56
- default="anthropic:claude-sonnet-4-5-20250929",
57
- description="Model to use (standard OpenAI field)",
88
+ # TODO: default should come from settings.llm.default_model at request time
89
+ # Using None and resolving in endpoint to avoid import-time settings evaluation
90
+ model: str | None = Field(
91
+ default=None,
92
+ description="Model to use. Defaults to LLM__DEFAULT_MODEL from settings.",
58
93
  )
59
94
  messages: list[ChatMessage] = Field(description="Chat conversation history")
60
95
  temperature: float | None = Field(default=None, ge=0, le=2)
@@ -69,6 +104,49 @@ class ChatCompletionRequest(BaseModel):
69
104
  default=None,
70
105
  description="Response format. Set type='json_object' to enable JSON mode.",
71
106
  )
107
+ # Additional OpenAI-compatible fields
108
+ metadata: dict[str, str] | None = Field(
109
+ default=None,
110
+ description="Key-value pairs attached to the request (max 16 keys, 64/512 char limits). "
111
+ "Merged with session metadata for persistence.",
112
+ )
113
+ store: bool | None = Field(
114
+ default=None,
115
+ description="Whether to store for distillation/evaluation purposes.",
116
+ )
117
+ max_completion_tokens: int | None = Field(
118
+ default=None,
119
+ ge=1,
120
+ description="Max tokens to generate (replaces deprecated max_tokens).",
121
+ )
122
+ seed: int | None = Field(
123
+ default=None,
124
+ description="Seed for deterministic sampling (best effort).",
125
+ )
126
+ top_p: float | None = Field(
127
+ default=None,
128
+ ge=0,
129
+ le=1,
130
+ description="Nucleus sampling probability. Use temperature OR top_p, not both.",
131
+ )
132
+ logprobs: bool | None = Field(
133
+ default=None,
134
+ description="Whether to return log probabilities for output tokens.",
135
+ )
136
+ top_logprobs: int | None = Field(
137
+ default=None,
138
+ ge=0,
139
+ le=20,
140
+ description="Number of most likely tokens to return at each position (requires logprobs=true).",
141
+ )
142
+ reasoning_effort: Literal["low", "medium", "high"] | None = Field(
143
+ default=None,
144
+ description="Reasoning effort for o-series models (low/medium/high).",
145
+ )
146
+ service_tier: Literal["auto", "flex", "priority", "default"] | None = Field(
147
+ default=None,
148
+ description="Service tier for processing (flex is 50% cheaper but slower).",
149
+ )
72
150
 
73
151
 
74
152
  # Response models
@@ -0,0 +1,33 @@
1
+ """OTEL utilities for chat routers."""
2
+
3
+ from loguru import logger
4
+
5
+
6
+ def get_tracer():
7
+ """Get the OpenTelemetry tracer for chat completions."""
8
+ try:
9
+ from opentelemetry import trace
10
+ return trace.get_tracer("rem.chat.completions")
11
+ except Exception:
12
+ return None
13
+
14
+
15
+ def get_current_trace_context() -> tuple[str | None, str | None]:
16
+ """Get trace_id and span_id from current OTEL context.
17
+
18
+ Returns:
19
+ Tuple of (trace_id, span_id) as hex strings, or (None, None) if not available.
20
+ """
21
+ try:
22
+ from opentelemetry import trace
23
+
24
+ span = trace.get_current_span()
25
+ ctx = span.get_span_context()
26
+ if ctx.is_valid:
27
+ trace_id = format(ctx.trace_id, '032x')
28
+ span_id = format(ctx.span_id, '016x')
29
+ return trace_id, span_id
30
+ except Exception as e:
31
+ logger.debug(f"Could not get trace context: {e}")
32
+
33
+ return None, None
@@ -0,0 +1,542 @@
1
+ """
2
+ SSE Event Types for Rich Streaming Responses.
3
+
4
+ This module defines custom Server-Sent Events (SSE) event types that extend
5
+ beyond simple text streaming.
6
+
7
+ ## SSE Protocol
8
+
9
+ Text content uses **OpenAI-compatible format** (plain `data:` prefix):
10
+ ```
11
+ data: {"id":"chatcmpl-...","choices":[{"delta":{"content":"Hello"}}]}
12
+ ```
13
+
14
+ Custom events use **named event format** (`event:` prefix):
15
+ ```
16
+ event: reasoning
17
+ data: {"type": "reasoning", "content": "Analyzing...", "step": 1}
18
+ ```
19
+
20
+ ## Event Types
21
+
22
+ | Event | Format | Purpose |
23
+ |-------|--------|---------|
24
+ | (text) | `data:` (OpenAI) | Content chunks - main response |
25
+ | reasoning | `event:` | Model thinking/chain-of-thought |
26
+ | progress | `event:` | Step indicators |
27
+ | tool_call | `event:` | Tool invocation start/complete |
28
+ | metadata | `event:` | System metadata (confidence, sources) |
29
+ | action_request | `event:` | UI solicitation (buttons, forms) |
30
+ | error | `event:` | Error notifications |
31
+ | done | `event:` | Stream completion marker |
32
+
33
+ ## Action Schema Design
34
+
35
+ - Inspired by Microsoft Adaptive Cards (https://adaptivecards.io/)
36
+ - JSON Schema-based UI element definitions
37
+ - Cross-platform compatibility for React, mobile, etc.
38
+
39
+ ## References
40
+
41
+ - MDN SSE: https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events
42
+ - Adaptive Cards: https://adaptivecards.io/explorer/
43
+ - Model Context Protocol: https://modelcontextprotocol.io/specification/2025-06-18
44
+ """
45
+
46
+ from enum import Enum
47
+ from typing import Any, Literal
48
+ from pydantic import BaseModel, Field
49
+
50
+
51
+ class SSEEventType(str, Enum):
52
+ """SSE event types for streaming responses."""
53
+
54
+ TEXT_DELTA = "text_delta" # Standard text chunk
55
+ REASONING = "reasoning" # Model thinking/reasoning
56
+ ACTION_REQUEST = "action_request" # UI action solicitation
57
+ METADATA = "metadata" # System metadata
58
+ PROGRESS = "progress" # Progress indicator
59
+ TOOL_CALL = "tool_call" # Tool invocation
60
+ ERROR = "error" # Error notification
61
+ DONE = "done" # Stream complete
62
+
63
+
64
+ # =============================================================================
65
+ # Action Solicitation Schema (Adaptive Cards-inspired)
66
+ # =============================================================================
67
+
68
+ class ActionStyle(str, Enum):
69
+ """Visual style for action buttons."""
70
+
71
+ DEFAULT = "default"
72
+ PRIMARY = "primary"
73
+ SECONDARY = "secondary"
74
+ DESTRUCTIVE = "destructive"
75
+ POSITIVE = "positive"
76
+
77
+
78
+ class ActionSubmit(BaseModel):
79
+ """
80
+ Submit action - triggers callback to server with payload.
81
+
82
+ Inspired by Adaptive Cards Action.Submit:
83
+ https://adaptivecards.io/explorer/Action.Submit.html
84
+ """
85
+
86
+ type: Literal["Action.Submit"] = "Action.Submit"
87
+ id: str = Field(description="Unique action identifier")
88
+ title: str = Field(description="Button label text")
89
+ style: ActionStyle = Field(
90
+ default=ActionStyle.DEFAULT,
91
+ description="Visual style"
92
+ )
93
+ data: dict[str, Any] = Field(
94
+ default_factory=dict,
95
+ description="Payload sent to server when action is triggered"
96
+ )
97
+ tooltip: str | None = Field(
98
+ default=None,
99
+ description="Tooltip text on hover"
100
+ )
101
+ icon_url: str | None = Field(
102
+ default=None,
103
+ description="Optional icon URL"
104
+ )
105
+
106
+
107
+ class ActionOpenUrl(BaseModel):
108
+ """
109
+ Open URL action - navigates to external URL.
110
+
111
+ Inspired by Adaptive Cards Action.OpenUrl:
112
+ https://adaptivecards.io/explorer/Action.OpenUrl.html
113
+ """
114
+
115
+ type: Literal["Action.OpenUrl"] = "Action.OpenUrl"
116
+ id: str = Field(description="Unique action identifier")
117
+ title: str = Field(description="Button label text")
118
+ url: str = Field(description="URL to open")
119
+ style: ActionStyle = Field(default=ActionStyle.DEFAULT)
120
+ tooltip: str | None = None
121
+
122
+
123
+ class ActionShowCard(BaseModel):
124
+ """
125
+ Show card action - reveals nested content inline.
126
+
127
+ Inspired by Adaptive Cards Action.ShowCard:
128
+ https://adaptivecards.io/explorer/Action.ShowCard.html
129
+ """
130
+
131
+ type: Literal["Action.ShowCard"] = "Action.ShowCard"
132
+ id: str = Field(description="Unique action identifier")
133
+ title: str = Field(description="Button label text")
134
+ card: dict[str, Any] = Field(
135
+ description="Nested card content to reveal (Adaptive Card JSON)"
136
+ )
137
+ style: ActionStyle = Field(default=ActionStyle.DEFAULT)
138
+
139
+
140
+ # Union type for all action types
141
+ ActionType = ActionSubmit | ActionOpenUrl | ActionShowCard
142
+
143
+
144
+ class InputText(BaseModel):
145
+ """Text input field for action cards."""
146
+
147
+ type: Literal["Input.Text"] = "Input.Text"
148
+ id: str = Field(description="Input field identifier (used in submit payload)")
149
+ label: str | None = Field(default=None, description="Input label")
150
+ placeholder: str | None = Field(default=None, description="Placeholder text")
151
+ is_required: bool = Field(default=False, description="Whether input is required")
152
+ is_multiline: bool = Field(default=False, description="Multi-line text area")
153
+ max_length: int | None = Field(default=None, description="Maximum character length")
154
+ value: str | None = Field(default=None, description="Default value")
155
+
156
+
157
+ class InputChoiceSet(BaseModel):
158
+ """Choice/select input for action cards."""
159
+
160
+ type: Literal["Input.ChoiceSet"] = "Input.ChoiceSet"
161
+ id: str = Field(description="Input field identifier")
162
+ label: str | None = None
163
+ choices: list[dict[str, str]] = Field(
164
+ description="List of {title, value} choice objects"
165
+ )
166
+ is_required: bool = False
167
+ is_multi_select: bool = Field(default=False, description="Allow multiple selections")
168
+ value: str | None = Field(default=None, description="Default selected value")
169
+
170
+
171
+ class InputToggle(BaseModel):
172
+ """Toggle/checkbox input for action cards."""
173
+
174
+ type: Literal["Input.Toggle"] = "Input.Toggle"
175
+ id: str = Field(description="Input field identifier")
176
+ title: str = Field(description="Toggle label text")
177
+ value: str = Field(default="false", description="Current value ('true'/'false')")
178
+ value_on: str = Field(default="true", description="Value when toggled on")
179
+ value_off: str = Field(default="false", description="Value when toggled off")
180
+
181
+
182
+ # Union type for all input types
183
+ InputType = InputText | InputChoiceSet | InputToggle
184
+
185
+
186
+ class ActionDisplayStyle(str, Enum):
187
+ """How to display the action request in the UI."""
188
+
189
+ INLINE = "inline" # Rendered inline after message content
190
+ FLOATING = "floating" # Floating panel/overlay
191
+ MODAL = "modal" # Modal dialog
192
+
193
+
194
+ class ActionRequestCard(BaseModel):
195
+ """
196
+ Action solicitation card - requests user input or action.
197
+
198
+ This is the main payload for action_request SSE events.
199
+ Uses Adaptive Cards-inspired schema for cross-platform UI compatibility.
200
+
201
+ Example use cases:
202
+ - Confirm/cancel dialogs
203
+ - Form inputs (name, email, etc.)
204
+ - Multi-choice selections
205
+ - Quick reply buttons
206
+ - Feedback collection (thumbs up/down)
207
+
208
+ Example:
209
+ ```json
210
+ {
211
+ "id": "confirm-delete-123",
212
+ "prompt": "Are you sure you want to delete this item?",
213
+ "display_style": "modal",
214
+ "actions": [
215
+ {
216
+ "type": "Action.Submit",
217
+ "id": "confirm",
218
+ "title": "Delete",
219
+ "style": "destructive",
220
+ "data": {"action": "delete", "item_id": "123"}
221
+ },
222
+ {
223
+ "type": "Action.Submit",
224
+ "id": "cancel",
225
+ "title": "Cancel",
226
+ "style": "secondary",
227
+ "data": {"action": "cancel"}
228
+ }
229
+ ],
230
+ "timeout_ms": 30000
231
+ }
232
+ ```
233
+ """
234
+
235
+ id: str = Field(description="Unique card identifier for response correlation")
236
+ prompt: str = Field(description="Prompt text explaining what action is requested")
237
+ display_style: ActionDisplayStyle = Field(
238
+ default=ActionDisplayStyle.INLINE,
239
+ description="How to display in the UI"
240
+ )
241
+ actions: list[ActionType] = Field(
242
+ default_factory=list,
243
+ description="Available actions (buttons)"
244
+ )
245
+ inputs: list[InputType] = Field(
246
+ default_factory=list,
247
+ description="Input fields for data collection"
248
+ )
249
+ timeout_ms: int | None = Field(
250
+ default=None,
251
+ description="Auto-dismiss timeout in milliseconds"
252
+ )
253
+ fallback_text: str | None = Field(
254
+ default=None,
255
+ description="Text to show if card rendering fails"
256
+ )
257
+
258
+
259
+ # =============================================================================
260
+ # SSE Event Payloads
261
+ # =============================================================================
262
+
263
+ class TextDeltaEvent(BaseModel):
264
+ """Text content delta event (OpenAI-compatible)."""
265
+
266
+ type: Literal["text_delta"] = "text_delta"
267
+ content: str = Field(description="Text content chunk")
268
+
269
+
270
+ class ReasoningEvent(BaseModel):
271
+ """
272
+ Reasoning/thinking event.
273
+
274
+ Used to stream model's chain-of-thought reasoning separate from
275
+ the main response content. UI can display this in a collapsible
276
+ "thinking" section.
277
+ """
278
+
279
+ type: Literal["reasoning"] = "reasoning"
280
+ content: str = Field(description="Reasoning text chunk")
281
+ step: int | None = Field(
282
+ default=None,
283
+ description="Reasoning step number (for multi-step reasoning)"
284
+ )
285
+
286
+
287
+ class ActionRequestEvent(BaseModel):
288
+ """
289
+ Action request event - solicits user action.
290
+
291
+ Sent when the agent needs user input or confirmation.
292
+ """
293
+
294
+ type: Literal["action_request"] = "action_request"
295
+ card: ActionRequestCard = Field(description="Action card definition")
296
+
297
+
298
+ class MetadataEvent(BaseModel):
299
+ """
300
+ Metadata event - system information (often hidden from user).
301
+
302
+ Used for confidence scores, sources, model info, message IDs, etc.
303
+ """
304
+
305
+ type: Literal["metadata"] = "metadata"
306
+
307
+ # Message correlation IDs
308
+ message_id: str | None = Field(
309
+ default=None,
310
+ description="Database ID of the assistant message being streamed"
311
+ )
312
+ in_reply_to: str | None = Field(
313
+ default=None,
314
+ description="Database ID of the user message this is responding to"
315
+ )
316
+ session_id: str | None = Field(
317
+ default=None,
318
+ description="Session ID for this conversation"
319
+ )
320
+
321
+ # Agent info
322
+ agent_schema: str | None = Field(
323
+ default=None,
324
+ description="Name of the agent schema used for this response (e.g., 'rem', 'query-assistant')"
325
+ )
326
+
327
+ # Session info
328
+ session_name: str | None = Field(
329
+ default=None,
330
+ description="Short 1-3 phrase name for the session topic (e.g., 'Prescription Drug Questions', 'AWS Setup Help')"
331
+ )
332
+
333
+ # Quality indicators
334
+ confidence: float | None = Field(
335
+ default=None, ge=0, le=1,
336
+ description="Confidence score (0-1)"
337
+ )
338
+ sources: list[str] | None = Field(
339
+ default=None,
340
+ description="Referenced sources/citations"
341
+ )
342
+
343
+ # Model info
344
+ model_version: str | None = Field(
345
+ default=None,
346
+ description="Model version used"
347
+ )
348
+
349
+ # Performance metrics
350
+ latency_ms: int | None = Field(
351
+ default=None,
352
+ description="Response latency in milliseconds"
353
+ )
354
+ token_count: int | None = Field(
355
+ default=None,
356
+ description="Token count for this response"
357
+ )
358
+
359
+ # Trace context for observability (deterministic, captured from OTEL)
360
+ trace_id: str | None = Field(
361
+ default=None,
362
+ description="OTEL trace ID for correlating with Phoenix/observability systems"
363
+ )
364
+ span_id: str | None = Field(
365
+ default=None,
366
+ description="OTEL span ID for correlating with Phoenix/observability systems"
367
+ )
368
+
369
+ # System flags
370
+ flags: list[str] | None = Field(
371
+ default=None,
372
+ description="System flags (e.g., 'uncertain', 'needs_review')"
373
+ )
374
+ hidden: bool = Field(
375
+ default=False,
376
+ description="If true, should not be displayed to user"
377
+ )
378
+ extra: dict[str, Any] | None = Field(
379
+ default=None,
380
+ description="Additional metadata"
381
+ )
382
+
383
+
384
+ class ProgressEvent(BaseModel):
385
+ """Progress indicator event."""
386
+
387
+ type: Literal["progress"] = "progress"
388
+ step: int = Field(description="Current step number")
389
+ total_steps: int = Field(description="Total number of steps")
390
+ label: str = Field(description="Step description")
391
+ status: Literal["pending", "in_progress", "completed", "failed"] = Field(
392
+ description="Step status"
393
+ )
394
+
395
+
396
+ class ToolCallEvent(BaseModel):
397
+ """Tool invocation event."""
398
+
399
+ type: Literal["tool_call"] = "tool_call"
400
+ tool_name: str = Field(description="Name of tool being called")
401
+ tool_id: str | None = Field(
402
+ default=None,
403
+ description="Unique call identifier"
404
+ )
405
+ status: Literal["started", "completed", "failed"] = Field(
406
+ description="Tool call status"
407
+ )
408
+ arguments: dict[str, Any] | None = Field(
409
+ default=None,
410
+ description="Tool arguments (for 'started' status)"
411
+ )
412
+ result: str | None = Field(
413
+ default=None,
414
+ description="Tool result summary (for 'completed' status)"
415
+ )
416
+ error: str | None = Field(
417
+ default=None,
418
+ description="Error message (for 'failed' status)"
419
+ )
420
+
421
+
422
+ class ErrorEvent(BaseModel):
423
+ """Error notification event."""
424
+
425
+ type: Literal["error"] = "error"
426
+ code: str = Field(description="Error code")
427
+ message: str = Field(description="Human-readable error message")
428
+ details: dict[str, Any] | None = Field(
429
+ default=None,
430
+ description="Additional error details"
431
+ )
432
+ recoverable: bool = Field(
433
+ default=True,
434
+ description="Whether error is recoverable"
435
+ )
436
+
437
+
438
+ class DoneEvent(BaseModel):
439
+ """Stream completion event."""
440
+
441
+ type: Literal["done"] = "done"
442
+ reason: Literal["stop", "length", "error", "cancelled"] = Field(
443
+ default="stop",
444
+ description="Completion reason"
445
+ )
446
+
447
+
448
+ # Union type for all SSE events
449
+ SSEEvent = (
450
+ TextDeltaEvent
451
+ | ReasoningEvent
452
+ | ActionRequestEvent
453
+ | MetadataEvent
454
+ | ProgressEvent
455
+ | ToolCallEvent
456
+ | ErrorEvent
457
+ | DoneEvent
458
+ )
459
+
460
+
461
+ # =============================================================================
462
+ # SSE Formatting Helpers
463
+ # =============================================================================
464
+
465
+ def format_sse_event(event: SSEEvent) -> str:
466
+ """
467
+ Format an SSE event for transmission.
468
+
469
+ Standard data: format for text_delta (OpenAI compatibility).
470
+ Named event: format for other event types.
471
+
472
+ Args:
473
+ event: SSE event to format
474
+
475
+ Returns:
476
+ Formatted SSE string ready for transmission
477
+
478
+ Example:
479
+ >>> event = ReasoningEvent(content="Analyzing...")
480
+ >>> format_sse_event(event)
481
+ 'event: reasoning\\ndata: {"type": "reasoning", "content": "Analyzing..."}\\n\\n'
482
+ """
483
+ import json
484
+
485
+ event_json = event.model_dump_json()
486
+
487
+ # TextDeltaEvent uses standard data: format for OpenAI compatibility
488
+ if isinstance(event, TextDeltaEvent):
489
+ return f"data: {event_json}\n\n"
490
+
491
+ # DoneEvent uses special marker
492
+ if isinstance(event, DoneEvent):
493
+ return f"event: done\ndata: {event_json}\n\n"
494
+
495
+ # All other events use named event format
496
+ event_type = event.type
497
+ return f"event: {event_type}\ndata: {event_json}\n\n"
498
+
499
+
500
+ def format_openai_sse_chunk(
501
+ request_id: str,
502
+ created: int,
503
+ model: str,
504
+ content: str | None = None,
505
+ role: str | None = None,
506
+ finish_reason: str | None = None,
507
+ ) -> str:
508
+ """
509
+ Format OpenAI-compatible SSE chunk.
510
+
511
+ Args:
512
+ request_id: Request/response ID
513
+ created: Unix timestamp
514
+ model: Model name
515
+ content: Delta content
516
+ role: Message role (usually 'assistant')
517
+ finish_reason: Finish reason (e.g., 'stop')
518
+
519
+ Returns:
520
+ Formatted SSE data line
521
+ """
522
+ import json
523
+
524
+ delta = {}
525
+ if role:
526
+ delta["role"] = role
527
+ if content is not None:
528
+ delta["content"] = content
529
+
530
+ chunk = {
531
+ "id": request_id,
532
+ "object": "chat.completion.chunk",
533
+ "created": created,
534
+ "model": model,
535
+ "choices": [{
536
+ "index": 0,
537
+ "delta": delta,
538
+ "finish_reason": finish_reason
539
+ }]
540
+ }
541
+
542
+ return f"data: {json.dumps(chunk)}\n\n"