PyPI - octostar-python-client - Versions diffs - 0.1.759__py3-none-any.whl - Mend

octostar-python-client 0.1.759__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (257) hide show

octostar/__init__.py +9 -0
octostar/api/__init__.py +1 -0
octostar/api/apps/__init__.py +0 -0
octostar/api/apps/deploy_app.py +210 -0
octostar/api/apps/execute_app_job.py +188 -0
octostar/api/apps/get_app_logs.py +210 -0
octostar/api/apps/get_apps_url.py +188 -0
octostar/api/apps/get_job_logs.py +210 -0
octostar/api/apps/get_job_progress.py +162 -0
octostar/api/apps/kill_job.py +160 -0
octostar/api/apps/list_app_jobs.py +276 -0
octostar/api/apps/list_apps.py +251 -0
octostar/api/apps/set_job_progress.py +216 -0
octostar/api/apps/undeploy_app.py +160 -0
octostar/api/metadata/__init__.py +0 -0
octostar/api/metadata/get_version.py +232 -0
octostar/api/metadata/get_whoami.py +232 -0
octostar/api/notifications/__init__.py +0 -0
octostar/api/notifications/delete_stream.py +222 -0
octostar/api/notifications/get_subscriptions.py +240 -0
octostar/api/notifications/publish_notification.py +275 -0
octostar/api/notifications/pull_events_from_stream.py +282 -0
octostar/api/notifications/push_event_to_stream.py +265 -0
octostar/api/notifications/toast.py +264 -0
octostar/api/ontology/__init__.py +0 -0
octostar/api/ontology/fetch_ontology_data.py +275 -0
octostar/api/ontology/get_ontologies.py +237 -0
octostar/api/ontology/multi_query.py +297 -0
octostar/api/ontology/query.py +276 -0
octostar/api/pipeline/__init__.py +1 -0
octostar/api/pipeline/get_processing_status.py +185 -0
octostar/api/pipeline/update_processing_status.py +164 -0
octostar/api/search/__init__.py +0 -0
octostar/api/search/get_annotations.py +153 -0
octostar/api/workspace_data/__init__.py +0 -0
octostar/api/workspace_data/delete_blob.py +212 -0
octostar/api/workspace_data/delete_entities.py +326 -0
octostar/api/workspace_data/download_blob.py +235 -0
octostar/api/workspace_data/get_attachment.py +336 -0
octostar/api/workspace_data/get_files_tree.py +397 -0
octostar/api/workspace_data/upload_blob.py +235 -0
octostar/api/workspace_data/upsert_entities.py +284 -0
octostar/api/workspace_permissions/__init__.py +0 -0
octostar/api/workspace_permissions/get_permissions.py +325 -0
octostar/api/workspace_tags/__init__.py +0 -0
octostar/api/workspace_tags/delete_tag_from_entities.py +141 -0
octostar/api/workspace_tags/tag_entities.py +180 -0
octostar/client.py +492 -0
octostar/errors.py +50 -0
octostar/models/__init__.py +249 -0
octostar/models/acknowledgement.py +74 -0
octostar/models/acknowledgement_with_data.py +82 -0
octostar/models/app_status.py +239 -0
octostar/models/app_status_annotations.py +66 -0
octostar/models/app_status_labels.py +69 -0
octostar/models/app_with_url.py +82 -0
octostar/models/child_processing_status.py +118 -0
octostar/models/delete_entities_response_401.py +74 -0
octostar/models/delete_entities_response_409.py +82 -0
octostar/models/delete_entities_response_500.py +82 -0
octostar/models/delete_stream_response_401.py +74 -0
octostar/models/delete_tag_from_entities_response_401.py +74 -0
octostar/models/deploy_app_json_body.py +90 -0
octostar/models/deploy_app_json_body_secrets.py +65 -0
octostar/models/deploy_app_response_200.py +98 -0
octostar/models/deploy_app_response_200_data.py +60 -0
octostar/models/deploy_app_response_400.py +82 -0
octostar/models/deploy_app_response_403.py +82 -0
octostar/models/deploy_app_response_404.py +82 -0
octostar/models/deploy_app_response_409.py +82 -0
octostar/models/deploy_app_response_500.py +82 -0
octostar/models/entity.py +80 -0
octostar/models/entity_response.py +99 -0
octostar/models/entity_response_s3_urls.py +93 -0
octostar/models/entity_response_s3_urls_additional_property.py +105 -0
octostar/models/entity_response_s3_urls_additional_property_fields.py +114 -0
octostar/models/execute_app_job_json_body.py +151 -0
octostar/models/execute_app_job_json_body_annotation.py +65 -0
octostar/models/execute_app_job_response_401.py +74 -0
octostar/models/fetch_ontology_data_response_200.py +60 -0
octostar/models/fetch_ontology_data_response_401.py +74 -0
octostar/models/fetch_ontology_data_response_500.py +82 -0
octostar/models/get_app_logs_response_401.py +74 -0
octostar/models/get_app_logs_response_404.py +74 -0
octostar/models/get_app_logs_response_500.py +82 -0
octostar/models/get_apps_url_json_body.py +76 -0
octostar/models/get_apps_url_response_401.py +74 -0
octostar/models/get_apps_url_response_500.py +82 -0
octostar/models/get_attachment_response_200.py +74 -0
octostar/models/get_attachment_response_401.py +74 -0
octostar/models/get_files_tree_response_200.py +106 -0
octostar/models/get_files_tree_response_200_status.py +8 -0
octostar/models/get_files_tree_response_400.py +111 -0
octostar/models/get_files_tree_response_400_data.py +60 -0
octostar/models/get_files_tree_response_400_status.py +8 -0
octostar/models/get_files_tree_response_401.py +74 -0
octostar/models/get_files_tree_response_500.py +111 -0
octostar/models/get_files_tree_response_500_data.py +60 -0
octostar/models/get_files_tree_response_500_status.py +8 -0
octostar/models/get_job_logs_response_401.py +74 -0
octostar/models/get_job_logs_response_404.py +74 -0
octostar/models/get_job_logs_response_500.py +82 -0
octostar/models/get_job_progress_response_401.py +74 -0
octostar/models/get_object_response_401.py +74 -0
octostar/models/get_ontologies_response_401.py +74 -0
octostar/models/get_ontologies_response_500.py +81 -0
octostar/models/get_permissions_response_200.py +98 -0
octostar/models/get_permissions_response_400.py +82 -0
octostar/models/get_permissions_response_401.py +74 -0
octostar/models/get_permissions_response_500.py +82 -0
octostar/models/get_processing_status_response_200.py +104 -0
octostar/models/get_processing_status_response_200_data.py +87 -0
octostar/models/get_processing_status_response_400.py +82 -0
octostar/models/get_processing_status_response_500.py +82 -0
octostar/models/get_subscriptions_response_200_item.py +74 -0
octostar/models/get_version_response_200.py +74 -0
octostar/models/get_version_response_404.py +74 -0
octostar/models/get_whoami_response_200.py +129 -0
octostar/models/get_whoami_response_401.py +74 -0
octostar/models/insert_entity.py +114 -0
octostar/models/insert_entity_base.py +266 -0
octostar/models/insert_entity_relationships_item.py +107 -0
octostar/models/insert_entity_request.py +94 -0
octostar/models/internal_server_error.py +82 -0
octostar/models/job_execution_result.py +146 -0
octostar/models/job_status.py +196 -0
octostar/models/job_status_labels.py +60 -0
octostar/models/job_with_url.py +82 -0
octostar/models/kill_job_response_401.py +74 -0
octostar/models/list_app_jobs_response_401.py +74 -0
octostar/models/list_app_jobs_response_500.py +82 -0
octostar/models/list_apps_response_401.py +74 -0
octostar/models/list_apps_response_500.py +82 -0
octostar/models/multi_query_json_body.py +100 -0
octostar/models/multi_query_json_body_queries_item.py +80 -0
octostar/models/multi_query_response_400.py +82 -0
octostar/models/multi_query_response_401.py +74 -0
octostar/models/not_found_error.py +74 -0
octostar/models/octostar_event.py +96 -0
octostar/models/octostar_event_octostar_payload.py +100 -0
octostar/models/octostar_event_octostar_payload_level.py +11 -0
octostar/models/os_notification.py +122 -0
octostar/models/processing_status.py +262 -0
octostar/models/processing_status_code.py +14 -0
octostar/models/progress_request.py +73 -0
octostar/models/publish_notification_response_401.py +74 -0
octostar/models/pull_events_from_stream_response_401.py +74 -0
octostar/models/push_event_to_stream_response_401.py +74 -0
octostar/models/query_json_body.py +101 -0
octostar/models/query_json_body_params.py +60 -0
octostar/models/query_response_400.py +82 -0
octostar/models/query_response_401.py +74 -0
octostar/models/set_job_progress_response_401.py +74 -0
octostar/models/string_to_value_label_map.py +99 -0
octostar/models/string_to_value_label_map_data.py +89 -0
octostar/models/string_to_value_label_map_data_additional_property.py +80 -0
octostar/models/successful_get_tags.py +103 -0
octostar/models/successful_insertion.py +98 -0
octostar/models/tag_entities_response_401.py +74 -0
octostar/models/toast_level.py +11 -0
octostar/models/toast_response_401.py +74 -0
octostar/models/undeploy_app_response_401.py +74 -0
octostar/models/update_processing_status_response_200.py +82 -0
octostar/models/update_processing_status_response_400.py +82 -0
octostar/models/update_processing_status_response_500.py +82 -0
octostar/models/upsert_entities_response_401.py +74 -0
octostar/models/upsert_entity.py +114 -0
octostar/models/upsert_entity_base.py +266 -0
octostar/models/upsert_entity_relationships_item.py +107 -0
octostar/py.typed +1 -0
octostar/types.py +54 -0
octostar/utils/__init__.py +15 -0
octostar/utils/chat/__init__.py +0 -0
octostar/utils/chat/chat.py +513 -0
octostar/utils/chat/detokenize.py +105 -0
octostar/utils/chat/get_default_model.py +50 -0
octostar/utils/chat/list_models.py +91 -0
octostar/utils/chat/tokenize.py +105 -0
octostar/utils/commons.py +226 -0
octostar/utils/exceptions.py +134 -0
octostar/utils/jobs/__init__.py +0 -0
octostar/utils/jobs/apps/__init__.py +0 -0
octostar/utils/jobs/apps/deploy_app.py +81 -0
octostar/utils/jobs/apps/execute_app_job.py +114 -0
octostar/utils/jobs/apps/get_app_logs.py +113 -0
octostar/utils/jobs/apps/get_app_secret.py +102 -0
octostar/utils/jobs/apps/get_apps_url.py +73 -0
octostar/utils/jobs/apps/list_app_jobs.py +62 -0
octostar/utils/jobs/apps/list_apps.py +126 -0
octostar/utils/jobs/apps/undeploy_app.py +48 -0
octostar/utils/jobs/get_job_logs.py +113 -0
octostar/utils/jobs/get_job_progress.py +76 -0
octostar/utils/jobs/kill_job.py +47 -0
octostar/utils/jobs/set_job_progress.py +67 -0
octostar/utils/meta/__init__.py +0 -0
octostar/utils/meta/get_version.py +30 -0
octostar/utils/meta/get_whoami.py +30 -0
octostar/utils/notifications/__init__.py +0 -0
octostar/utils/notifications/delete_stream.py +58 -0
octostar/utils/notifications/get_my_subscriptions.py +49 -0
octostar/utils/notifications/publish_notification.py +73 -0
octostar/utils/notifications/pull_event_from_stream.py +63 -0
octostar/utils/notifications/pull_events_from_stream.py +64 -0
octostar/utils/notifications/push_event_to_stream.py +109 -0
octostar/utils/notifications/push_events_to_stream.py +137 -0
octostar/utils/notifications/toast.py +92 -0
octostar/utils/ontology/__init__.py +10 -0
octostar/utils/ontology/fetch_ontology_data.py +141 -0
octostar/utils/ontology/get_ontologies.py +55 -0
octostar/utils/ontology/multiquery_ontology.py +287 -0
octostar/utils/ontology/query_ontology.py +186 -0
octostar/utils/pipeline/__init__.py +1 -0
octostar/utils/pipeline/get_processing_status.py +230 -0
octostar/utils/pipeline/update_processing_status.py +286 -0
octostar/utils/search/__init__.py +11 -0
octostar/utils/search/bulk_update.py +138 -0
octostar/utils/search/count.py +117 -0
octostar/utils/search/get_entity_annotations.py +304 -0
octostar/utils/search/get_index_definition.py +111 -0
octostar/utils/search/multi_search.py +129 -0
octostar/utils/workspace/__init__.py +0 -0
octostar/utils/workspace/delete_entities.py +247 -0
octostar/utils/workspace/delete_entity.py +81 -0
octostar/utils/workspace/delete_relationship.py +78 -0
octostar/utils/workspace/delete_relationships.py +85 -0
octostar/utils/workspace/delete_temporary_blob.py +85 -0
octostar/utils/workspace/extract_entities.py +140 -0
octostar/utils/workspace/get_filepath_from_item.py +85 -0
octostar/utils/workspace/get_filepaths_from_items.py +100 -0
octostar/utils/workspace/get_files_tree.py +102 -0
octostar/utils/workspace/get_item_from_filepath.py +102 -0
octostar/utils/workspace/get_items_from_filepaths.py +108 -0
octostar/utils/workspace/linkcharts/__init__.py +0 -0
octostar/utils/workspace/linkcharts/create_linkchart.py +241 -0
octostar/utils/workspace/permissions/PermissionLevel.py +8 -0
octostar/utils/workspace/permissions/__init__.py +1 -0
octostar/utils/workspace/permissions/get_permissions.py +81 -0
octostar/utils/workspace/read_attachment.py +284 -0
octostar/utils/workspace/read_file.py +113 -0
octostar/utils/workspace/read_temporary_blob.py +428 -0
octostar/utils/workspace/saved_searches/__init__.py +0 -0
octostar/utils/workspace/saved_searches/create_saved_search.py +183 -0
octostar/utils/workspace/tags/__init__.py +0 -0
octostar/utils/workspace/tags/delete_tag_from_entities.py +96 -0
octostar/utils/workspace/tags/tag_entities.py +175 -0
octostar/utils/workspace/upsert_entities.py +268 -0
octostar/utils/workspace/upsert_entity.py +110 -0
octostar/utils/workspace/upsert_relationship.py +128 -0
octostar/utils/workspace/upsert_relationships.py +194 -0
octostar/utils/workspace/write_attachment.py +263 -0
octostar/utils/workspace/write_file.py +335 -0
octostar/utils/workspace/write_temporary_blob.py +218 -0
octostar_python_client-0.1.759.dist-info/METADATA +159 -0
octostar_python_client-0.1.759.dist-info/RECORD +257 -0
octostar_python_client-0.1.759.dist-info/WHEEL +5 -0
octostar_python_client-0.1.759.dist-info/licenses/LICENSE +21 -0
octostar_python_client-0.1.759.dist-info/top_level.txt +1 -0

octostar/utils/chat/chat.py ADDED Viewed

@@ -0,0 +1,513 @@
+import asyncio as _asyncio
+import httpx
+from collections.abc import AsyncIterator, Callable
+from typing import Optional, List, Any, Literal, Union, Dict, TypedDict
+from pydantic import BaseModel, Field, ValidationError
+from datetime import datetime
+from enum import Enum
+import json
+import logging
+from ...client import Client, get_default_client
+from ..exceptions import ApiConnectionError, StopAsyncIterationWithResult
+from ..commons import network_retry_strategy, TimeoutAsyncGenerator
+_logger = logging.getLogger(__name__)
+class EntityBase(BaseModel):
+    class Config:
+        extra = "allow"
+    entity_type: str = "os_workspace"
+    entity_id: str
+    entity_label: Optional[str] = None
+class SearchSetModel(BaseModel):
+    """Search-set payload; one of the shapes accepted as ``ChatMessage.content``."""
+    entity_id: str
+    entity_label: str
+    # NOTE(review): presumably the search query definition backing the set;
+    # its schema is not visible from this module.
+    query: dict
+class ChatMessagePriority(Enum):
+    """Priority levels for chat messages."""
+    # NOTE(review): not referenced anywhere else in the visible part of this
+    # module; confirm whether the ordering (0 = highest) matters to callers.
+    CRITICAL = 0
+    CONTEXTUAL = 1
+    HISTORICAL = 2
+# Accepted values for the ``context_mode`` argument of the chat entry points.
+# NOTE(review): the entry-point signatures spell this Literal out again
+# instead of using the alias.
+ContextMode = Literal["limited_to_context", "context_boosted"]
+class ToolName(TypedDict):
+    """Identifies a tool; items of this type make up the ``disabled_tools`` list."""
+    # NOTE(review): presumably the provider/namespace the tool comes from — confirm.
+    source: str
+    name: str
+class ExecutionMode(str, Enum):
+    """The execution mode for a chat request."""
+    # Mixing in ``str`` makes each member a plain string as well, so the value
+    # can be placed directly in the JSON request body.
+    # Per the chat entry-point docstrings in this module, only COMPLETION is
+    # still supported; SIMPLE and AGENTIC are deprecated and rejected by the
+    # backend with HTTP 400.
+    COMPLETION = "completion"
+    """Pure pass-through: no system prompt or processing, just forwards messages to the LLM."""
+    SIMPLE = "simple"
+    """Basic chat with a system prompt, but no RAG retrieval or tool usage."""
+    AGENTIC = "agentic"
+    """Full agent: formulates a plan, retrieves context via RAG, and invokes tools as needed."""
+class ChatMessage(BaseModel):
+    """
+    Represents a single chat message in the conversation. Class is taken from octostar-api lib.
+    """
+    id: str = Field(..., description="The unique ID of the message.")
+    role: str = Field(
+        ...,
+        description="The role of the message sender. Must be 'user', 'assistant', or 'system'.",
+    )
+    content: Union[List[EntityBase], SearchSetModel, str, Dict[str, Any]] = Field(
+        ..., description="The content of the message."
+    )
+    type: Optional[
+        Literal[
+            "text",
+            "json",
+            "add_entities",
+            "remove_entities",
+            "add_search_set",
+            "remove_search_set",
+        ]
+    ] = Field(
+        None,
+        description=(
+            "The type of the message. Can be 'text', 'json', 'add_entities', 'remove_entities', 'add_search_set' or 'remove_search_set."
+        ),
+    )
+    timestamp: Optional[datetime] = Field(
+        None, description="The timestamp of the message in ISO 8601 format."
+    )
+class ChatStreamEvent(TypedDict, total=False):
+    """A single event from the streaming chat endpoint.
+
+    Declared with ``total=False``, so either key may be absent from an event.
+    """
+    channel: str
+    """The event channel: 'text', 'agentic', 'context', 'final_prompt', 'heartbeat', 'error', or 'status'."""
+    content: Any
+    """The event payload. For 'text' events this is the accumulated response text so far."""
+def _build_request(
+    prompt: str,
+    *,
+    chat_history: Optional[list[ChatMessage]],
+    workspaces: Optional[list[EntityBase]],
+    context_mode: str,
+    model_name: Optional[str],
+    execution_mode: ExecutionMode,
+    disabled_tools: Optional[list[ToolName]],
+    streaming: bool,
+    client: Client,
+    extra_body: Optional[dict] = None,
+) -> tuple:
+    """Build the endpoint URL, headers, and JSON body for the chat API.
+    Returns:
+        (endpoint_url, headers, body)
+    """
+    endpoint_url = f"{client.get_base_url_v1()}/api/v1/chat"
+    headers = {
+        "Content-Type": "application/json",
+        # ``.token`` lives on AuthenticatedClient (the runtime type); the
+        # param is annotated with the Client base for call-site flexibility.
+        "Authorization": f"Bearer {client.token}",  # pyright: ignore[reportAttributeAccessIssue]
+        "x-ontology": client.ontology,
+    }
+    ws_list = workspaces or []
+    ws_dicts = [ws.model_dump() for ws in ws_list]
+    for ws in ws_dicts:
+        if "os_workspace" not in ws:
+            ws["os_workspace"] = ws["entity_id"]
+    hist = chat_history or []
+    hist_dicts = [ch.model_dump() for ch in hist]
+    hist_dicts = [
+        {
+            **m,
+            "timestamp": (
+                m.get("timestamp", "").strftime("%Y-%m-%d %H:%M:%S")
+                if isinstance(m.get("timestamp"), datetime)
+                else None
+            ),
+        }
+        for m in hist_dicts
+    ]
+    body = {
+        **(extra_body or {}),
+        "model_name": model_name,
+        "messages": hist_dicts,
+        "prompt": prompt,
+        "streaming": streaming,
+        "execution_mode": execution_mode,
+        "context_mode": context_mode,
+        "api_key": "",
+        "cohere_key": "",
+        "open_workspaces": ws_dicts,
+        "disabled_tools": disabled_tools or [],
+        "deployment_url": client.get_base_url_v1(),
+        **(
+            {} if "prompt_overrides" in (extra_body or {}) else {"prompt_overrides": {}}
+        ),
+    }
+    return endpoint_url, headers, body
+def _parse_response(message, response_validation):
+    if response_validation == "json" or (
+        isinstance(response_validation, type)
+        and issubclass(response_validation, BaseModel)
+    ):
+        message = message.strip()
+        if message.startswith("```json"):
+            message = message[7:]
+        if message.startswith("```"):
+            message = message[3:]
+        if message.endswith("```"):
+            message = message[:-3]
+        try:
+            message = json.loads(message)
+        except json.JSONDecodeError as e:
+            raise ValueError(f"Response is not valid JSON: {e}\nContent: {message}")
+        if response_validation == "json":
+            return message
+        elif isinstance(response_validation, type) and issubclass(
+            response_validation, BaseModel
+        ):
+            try:
+                return response_validation.model_validate(message)
+            except ValidationError as e:
+                raise ValueError(
+                    f"Response does not match schema {response_validation.__name__}: {e}\nContent: {message}"
+                )
+        else:
+            return message
+    else:
+        return message
+def sync(
+    prompt: str,
+    chat_history: Optional[list[ChatMessage]] = None,
+    workspaces: Optional[list[EntityBase]] = None,
+    context_mode: Literal["limited_to_context", "context_boosted"] = "context_boosted",
+    model_name: Optional[str] = None,
+    timeout: Optional[float] = 300.0,
+    retries: int = 2,
+    disabled_tools: Optional[list[ToolName]] = None,
+    execution_mode: ExecutionMode = ExecutionMode.COMPLETION,
+    response_validation: Union[None, Literal["json"], type[BaseModel]] = None,
+    client: Optional[Client] = None,
+    **kwargs,
+) -> Union[str, dict, list, BaseModel]:
+    """
+    # Make a request for the AI chat endpoint.
+    ## Arguments
+    - `prompt`: The user prompt to send to the chatbot.
+    - `chat_history`: The list of messages that precede the user prompt.
+    - `workspaces`: The list of workspaces the chatbot is able to see.
+    - `context_mode`: The filtering mode for entities retrieved by the chatbot using RAG. Can be set to:
+        * 'context_boosted': The context provided in the chat history is boosted in the RAG results,
+            but results from the whole knowledge base can be retrieved;
+        * 'limited_to_context': Only context provided in the chat history can be retrieved and used via RAG.
+    - `timeout`: The timeout for the connection to the search engine. Can be set to "None" for no enforced timeout.
+    - `retries`: The number of connection retries. Note that each retry may cost additional tokens.
+    - `disabled_tools`: A list of tools that the LLM is banned from using for this invocation.
+    - `execution_mode`: The mode with which the LLM will answer. Defaults to
+        'completion'. Only 'completion' is supported — 'simple' and 'agentic'
+        are deprecated and rejected by the backend with HTTP 400:
+        * 'completion': Pure pass-through — no system prompt or processing, just forwards messages to the LLM;
+    - `response_validation`: Whether the response should follow a given pattern. Possible values are:
+        * None: No validation on the response;
+        * 'json': Response is validated to be a JSON;
+        * type[BaseModel]: Response is validated against the given pydantic model class;
+    - `client`: The Client with which to connect to Octostar. If None, the default one is used.
+    - `**kwargs`: Additional keyword arguments are merged into the request body.
+        Explicit parameters above take precedence over kwargs.
+    ## Returns
+    The chatbot response, as plain text.
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful.
+    """
+    if not client:
+        client = get_default_client()
+    endpoint_url, headers, body = _build_request(
+        prompt,
+        chat_history=chat_history,
+        workspaces=workspaces,
+        context_mode=context_mode,
+        model_name=model_name,
+        execution_mode=execution_mode,
+        disabled_tools=disabled_tools,
+        streaming=False,
+        client=client,
+        extra_body=kwargs,
+    )
+    response = None
+    try:
+        for attempt in network_retry_strategy(retries=retries):
+            with attempt:
+                with httpx.Client() as httpx_client:
+                    response = httpx_client.post(
+                        endpoint_url, json=body, headers=headers, timeout=timeout
+                    )
+                    response.raise_for_status()
+                try:
+                    chatbot_response = response.json()["response"]["content"]
+                except Exception as e:
+                    raise ConnectionError(
+                        f"Unparsable response format {response.content} with exception {e}"
+                    )
+                try:
+                    chatbot_response = _parse_response(
+                        chatbot_response, response_validation
+                    )
+                except Exception as e:
+                    raise ConnectionError(
+                        f"Validation failed for {chatbot_response} with exception {e}"
+                    )
+    except Exception:
+        raise ApiConnectionError("chat", response, client)
+    return chatbot_response
+async def asyncio(
+    prompt: str,
+    chat_history: Optional[list[ChatMessage]] = None,
+    workspaces: Optional[list[EntityBase]] = None,
+    context_mode: Literal["limited_to_context", "context_boosted"] = "context_boosted",
+    model_name: Optional[str] = None,
+    timeout: Optional[float] = 300.0,
+    retries: int = 2,
+    disabled_tools: Optional[list[ToolName]] = None,
+    execution_mode: ExecutionMode = ExecutionMode.COMPLETION,
+    response_validation: Union[None, Literal["json"], type[BaseModel]] = None,
+    client: Optional[Client] = None,
+    **kwargs,
+) -> Union[str, dict, list, BaseModel]:
+    """
+    # Make asynchronously a request for the AI chat endpoint.
+    ## Arguments
+    - `prompt`: The user prompt to send to the chatbot.
+    - `chat_history`: The list of messages that precede the user prompt.
+    - `workspaces`: The list of workspaces the chatbot is able to see.
+    - `context_mode`: The filtering mode for entities retrieved by the chatbot using RAG. Can be set to:
+        * 'context_boosted': The context provided in the chat history is boosted in the RAG results,
+            but results from the whole knowledge base can be retrieved;
+        * 'limited_to_context': Only context provided in the chat history can be retrieved and used via RAG.
+    - `timeout`: The timeout for the connection to the search engine. Can be set to "None" for no enforced timeout.
+    - `retries`: The number of connection retries. Note that each retry may cost additional tokens.
+    - `disabled_tools`: A list of tools that the LLM is banned from using for this invocation.
+    - `execution_mode`: The mode with which the LLM will answer. Defaults to
+        'completion'. Only 'completion' is supported — 'simple' and 'agentic'
+        are deprecated and rejected by the backend with HTTP 400:
+        * 'completion': Pure pass-through — no system prompt or processing, just forwards messages to the LLM;
+    - `response_validation`: Whether the response should follow a given pattern. Possible values are:
+        * None: No validation on the response, response is in plain text;
+        * 'json': Response is validated to be a JSON, and returned as a dict;
+        * type[BaseModel]: Response is validated against the given pydantic model class, and returned as an instance of that class;
+    - `client`: The Client with which to connect to Octostar. If None, the default one is used.
+    - `**kwargs`: Additional keyword arguments are merged into the request body.
+        Explicit parameters above take precedence over kwargs.
+    ## Returns
+    The chatbot response, parsed or as plain text.
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful.
+    """
+    if not client:
+        client = get_default_client()
+    endpoint_url, headers, body = _build_request(
+        prompt,
+        chat_history=chat_history,
+        workspaces=workspaces,
+        context_mode=context_mode,
+        model_name=model_name,
+        execution_mode=execution_mode,
+        disabled_tools=disabled_tools,
+        streaming=False,
+        client=client,
+        extra_body=kwargs,
+    )
+    response = None
+    try:
+        for attempt in network_retry_strategy(retries=retries):
+            with attempt:
+                async with httpx.AsyncClient() as httpx_client:
+                    response = await httpx_client.post(
+                        endpoint_url, json=body, headers=headers, timeout=timeout
+                    )
+                    response.raise_for_status()
+                try:
+                    chatbot_response = response.json()["response"]["content"]
+                except Exception as e:
+                    raise ConnectionError(
+                        f"Unparsable response format {response.content} with exception {e}"
+                    )
+                try:
+                    chatbot_response = _parse_response(
+                        chatbot_response, response_validation
+                    )
+                except Exception as e:
+                    raise ConnectionError(
+                        f"Validation failed for {chatbot_response} with exception {e}"
+                    )
+    except Exception:
+        raise ApiConnectionError("chat", response, client)
+    return chatbot_response
+async def streaming(
+    prompt: str,
+    chat_history: Optional[list[ChatMessage]] = None,
+    workspaces: Optional[list[EntityBase]] = None,
+    context_mode: Literal["limited_to_context", "context_boosted"] = "context_boosted",
+    model_name: Optional[str] = None,
+    timeout: Optional[float] = 300.0,
+    disabled_tools: Optional[list[ToolName]] = None,
+    execution_mode: ExecutionMode = ExecutionMode.COMPLETION,
+    fail_condition: Optional[Callable[[List[ChatStreamEvent]], bool]] = None,
+    end_condition: Optional[Callable[[List[ChatStreamEvent]], bool]] = None,
+    client: Optional[Client] = None,
+    **kwargs,
+) -> AsyncIterator[Union[ChatStreamEvent, str]]:
+    """
+    # Stream a request to the AI chat endpoint.
+    Opens a streaming HTTP connection and yields parsed events as they arrive.
+    Each event is a `ChatStreamEvent` dict with a `channel` key indicating the
+    event type and a `content` key with the payload.
+    Catch `StopAsyncIterationWithResult` to get the final accumulated text
+    response after the stream ends::
+        try:
+            async for event in chat.streaming(prompt="Hello"):
+                print(event)          # process events in real-time
+        except StopAsyncIterationWithResult as r:
+            final_text = r.value      # the full response text
+    ## Arguments
+    - `prompt`: The user prompt to send to the chatbot.
+    - `chat_history`: The list of messages that precede the user prompt.
+    - `workspaces`: The list of workspaces the chatbot is able to see.
+    - `context_mode`: The filtering mode for entities retrieved by the chatbot using RAG. Can be set to:
+        * 'context_boosted': The context provided in the chat history is boosted in the RAG results,
+            but results from the whole knowledge base can be retrieved;
+        * 'limited_to_context': Only context provided in the chat history can be retrieved and used via RAG.
+    - `timeout`: The timeout for the connection to the search engine. Can be set to "None" for no enforced timeout.
+    - `disabled_tools`: A list of tools that the LLM is banned from using for this invocation.
+    - `execution_mode`: The mode with which the LLM will answer. Defaults to
+        'completion'. Only 'completion' is supported — 'simple' and 'agentic'
+        are deprecated and rejected by the backend with HTTP 400:
+        * 'completion': Pure pass-through — no system prompt or processing, just forwards messages to the LLM;
+    - `fail_condition`: Custom condition to determine when the stream should be considered
+        failed. Receives the list of ChatStreamEvent dicts collected so far and returns
+        True to trigger an ApiConnectionError. If None, defaults to failing on events
+        with channel ``'error'``.
+    - `end_condition`: Custom condition to determine when the stream should stop early.
+        Receives the list of ChatStreamEvent dicts collected so far and returns True to
+        end the stream. If None, defaults to streaming until completion (or timeout).
+    - `client`: The Client with which to connect to Octostar. If None, the default one is used.
+    - `**kwargs`: Additional keyword arguments are merged into the request body.
+        Explicit parameters above take precedence over kwargs.
+    ## Yields
+    `ChatStreamEvent` dicts. Common channels:
+    - `'text'`: Accumulated generated text so far.
+    - `'agentic'`: Tool-call or agent status updates.
+    - `'context'`: RAG context entities retrieved.
+    - `'final_prompt'`: The full prompt sent to the LLM.
+    - `'heartbeat'`: Keep-alive pings (can be ignored).
+    - `'error'`: Error messages from the server.
+    ## Raises
+    - `StopAsyncIterationWithResult`: When the stream ends normally. `value` holds
+        the final accumulated text response (``str``).
+    - `ApiConnectionError`: If the connection or initial response failed, or the
+        fail_condition returned True.
+    """
+    if fail_condition is None:
+        fail_condition = lambda events: any(e.get("channel") == "error" for e in events)
+    if end_condition is None:
+        end_condition = lambda _events: False
+    if not client:
+        client = get_default_client()
+    endpoint_url, headers, body = _build_request(
+        prompt,
+        chat_history=chat_history,
+        workspaces=workspaces,
+        context_mode=context_mode,
+        model_name=model_name,
+        execution_mode=execution_mode,
+        disabled_tools=disabled_tools,
+        streaming=True,
+        client=client,
+        extra_body=kwargs,
+    )
+    async def _parse_lines(resp: httpx.Response) -> AsyncIterator[ChatStreamEvent]:
+        async for line in resp.aiter_lines():
+            if not line.strip():
+                continue
+            try:
+                yield json.loads(line)
+            except json.JSONDecodeError:
+                _logger.warning("chat streaming: unparsable line: %s", line[:200])
+    collected_events: List[ChatStreamEvent] = []
+    accumulated_text = ""
+    try:
+        async with httpx.AsyncClient() as httpx_client:
+            async with httpx_client.stream(
+                "POST", endpoint_url, json=body, headers=headers, timeout=timeout
+            ) as response:
+                if response.status_code != 200:
+                    await response.aread()
+                    raise ConnectionError(
+                        f"chat streaming: HTTP {response.status_code}: {response.text[:500]}"
+                    )
+                event_stream = _parse_lines(response)
+                if timeout is not None:
+                    event_stream = TimeoutAsyncGenerator(event_stream, timeout)
+                try:
+                    async for event in event_stream:
+                        collected_events.append(event)
+                        if event.get("channel") == "text":
+                            accumulated_text += event.get("content", "")
+                        if fail_condition(collected_events):
+                            raise ConnectionError(
+                                "chat streaming: fail_condition triggered"
+                            )
+                        if end_condition(collected_events):
+                            break
+                        yield event
+                except _asyncio.TimeoutError:
+                    _logger.warning(
+                        "chat streaming: timed out after %s seconds", timeout
+                    )
+    except (ConnectionError, httpx.HTTPStatusError) as e:
+        raise ApiConnectionError("chat streaming", None, client) from e
+    raise StopAsyncIterationWithResult(value=accumulated_text)

octostar/utils/chat/detokenize.py ADDED Viewed

@@ -0,0 +1,105 @@
+import httpx
+from typing import Optional
+from ...client import Client, get_default_client
+from ..exceptions import ApiConnectionError
+from typing import Optional
+from ..commons import network_retry_strategy
+def _prepare_detokenize_request(client, tokens, model_name):
+    """
+    # Build the keyword arguments for the detokenize HTTP POST call.
+    ## Arguments
+    - `client`: Object exposing `get_base_url_v1()`, `token` and `ontology`.
+    - `tokens`: The tokens placed under the `tokens` key of the JSON body.
+    - `model_name`: The value placed under the `model_name` key of the JSON body.
+    ## Returns
+    A dict with the keys `url`, `headers`, `timeout` and `json`, meant to be
+    unpacked into an httpx `post` call.
+    """
+    base_url = client.get_base_url_v1()
+    auth_headers = {
+        "Authorization": f"Bearer {client.token}",
+        "x-ontology": client.ontology,
+    }
+    payload = {"tokens": tokens, "model_name": model_name}
+    return dict(
+        url=f"{base_url}/api/v2/ai/llm/detokenize",
+        headers=auth_headers,
+        timeout=60,
+        json=payload,
+    )
+def sync(
+    tokens: list[int],
+    model_name: str,
+    client: Optional[Client] = None,
+) -> str:
+    """
+    # Detokenize a list of LLM tokens into a string.
+    ## Arguments
+    - `tokens`: The input list of tokens.
+    - `model_name`: The model with which to detokenize the input tokens.
+    - `client`: The Client with which to connect to Octostar. If None, the default one is used.
+    ## Returns
+    The detokenized string (the `text` field of the JSON response).
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful. The underlying
+      exception is attached as its `__cause__`.
+    """
+    if not client:
+        client = get_default_client()
+    # `response` first holds the latest HTTP response and is rebound to the
+    # decoded text on success; on failure the last value is handed to
+    # ApiConnectionError.
+    response = None
+    try:
+        for attempt in network_retry_strategy(retries=3):
+            with attempt:
+                with httpx.Client() as httpx_client:
+                    response = httpx_client.post(
+                        **_prepare_detokenize_request(client, tokens, model_name)
+                    )
+                    response.raise_for_status()
+                try:
+                    response = response.json()["text"]
+                except Exception as e:
+                    # Raised inside the attempt context; presumably this lets the
+                    # retry strategy treat a malformed body like a network
+                    # failure -- confirm against network_retry_strategy.
+                    raise ConnectionError(
+                        f"Unparsable response format {response.content} with exception {e}"
+                    ) from e
+    except Exception as e:
+        # Chain explicitly so the root cause is reported as the direct cause.
+        raise ApiConnectionError("detokenize", response, client) from e
+    return response  # pyright: ignore[reportReturnType]
+async def asyncio(
+    tokens: list[int],
+    model_name: str,
+    client: Optional[Client] = None,
+) -> str:
+    """
+    # Detokenize asynchronously a list of LLM tokens into a string.
+    ## Arguments
+    - `tokens`: The input list of tokens.
+    - `model_name`: The model with which to detokenize the input tokens.
+    - `client`: The Client with which to connect to Octostar. If None, the default one is used.
+    ## Returns
+    The detokenized string (the `text` field of the JSON response).
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful. The underlying
+      exception is attached as its `__cause__`.
+    """
+    if not client:
+        client = get_default_client()
+    # `response` first holds the latest HTTP response and is rebound to the
+    # decoded text on success; on failure the last value is handed to
+    # ApiConnectionError.
+    response = None
+    try:
+        # NOTE(review): the retry loop uses a synchronous `for`/`with` inside a
+        # coroutine; if the strategy sleeps between attempts it may block the
+        # event loop -- confirm against network_retry_strategy.
+        for attempt in network_retry_strategy(retries=3):
+            with attempt:
+                async with httpx.AsyncClient() as httpx_client:
+                    response = await httpx_client.post(
+                        **_prepare_detokenize_request(client, tokens, model_name)
+                    )
+                    response.raise_for_status()
+                try:
+                    response = response.json()["text"]
+                except Exception as e:
+                    # Raised inside the attempt context; presumably this lets the
+                    # retry strategy treat a malformed body like a network
+                    # failure -- confirm against network_retry_strategy.
+                    raise ConnectionError(
+                        f"Unparsable response format {response.content} with exception {e}"
+                    ) from e
+    except Exception as e:
+        # Chain explicitly so the root cause is reported as the direct cause.
+        raise ApiConnectionError("detokenize", response, client) from e
+    return response  # pyright: ignore[reportReturnType]

octostar/utils/chat/get_default_model.py ADDED Viewed

@@ -0,0 +1,50 @@
+from typing import Optional
+from ...client import Client
+from . import list_models
+def _get_default_model_from_list(models):
+    """
+    # Pick the single model flagged as default out of a list of models.
+    ## Arguments
+    - `models`: An iterable of dict-like model descriptions.
+    ## Returns
+    The one entry whose `is_default` value compares equal to `True`.
+    ## Raises
+    - `ValueError`: If the number of entries flagged as default is not exactly one.
+    """
+    # `== True` is kept on purpose: it preserves the original matching rule.
+    flagged = [entry for entry in models if entry.get("is_default") == True]
+    if len(flagged) == 1:
+        return flagged[0]
+    raise ValueError(f"Found {len(flagged)} default models instead of 1")
+def sync(
+    client: Optional[Client] = None,
+) -> dict:
+    """
+    # Fetch the AI chat model currently marked as default.
+    ## Arguments
+    - `client`: The Client with which to connect to Octostar. It is forwarded as-is to `list_models.sync`.
+    ## Returns
+    The dict describing the default AI model.
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful.
+    - `ValueError`: If the listed models do not contain exactly one default model.
+    """
+    return _get_default_model_from_list(list_models.sync(client=client))
+async def asyncio(
+    client: Optional[Client] = None,
+) -> dict:
+    """
+    # Fetch asynchronously the AI chat model currently marked as default.
+    ## Arguments
+    - `client`: The Client with which to connect to Octostar. It is forwarded as-is to `list_models.asyncio`.
+    ## Returns
+    The dict describing the default AI model.
+    ## Raises
+    - `ApiConnectionError`: If the query was unsuccessful.
+    - `ValueError`: If the listed models do not contain exactly one default model.
+    """
+    available_models = await list_models.asyncio(client=client)
+    default_entry = _get_default_model_from_list(available_models)
+    return default_entry