PyPI - docent-python - Versions diffs - 0.1.25a0__py3-none-any.whl → 0.1.26a0__py3-none-any.whl - Mend

docent-python 0.1.25a0__py3-none-any.whl → 0.1.26a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

docent/_llm_util/data_models/llm_output.py CHANGED Viewed

@@ -8,6 +8,7 @@ from pydantic import BaseModel
 from docent._llm_util.data_models.exceptions import (
     LLM_ERROR_TYPES,
     CompletionTooLongException,
+    ContextWindowException,
     LLMException,
 )
 from docent._log_util import get_logger
@@ -148,6 +149,13 @@ class LLMOutput:
     def from_dict(cls, data: dict[str, Any]) -> "LLMOutput":
         error_type_map = {e.error_type_id: e for e in LLM_ERROR_TYPES}
         errors = data.get("errors", [])
+        error_types_to_not_log: list[str] = [
+            CompletionTooLongException.error_type_id,
+            ContextWindowException.error_type_id,
+        ]
+        errors_to_log = [e for e in errors if e not in error_types_to_not_log]
+        if errors_to_log:
+            logger.error(f"Loading LLM output with errors: {errors}")
         errors = [error_type_map.get(e, LLMException)() for e in errors]
         completions = data.get("completions", [])

docent/_llm_util/llm_svc.py CHANGED Viewed

@@ -176,7 +176,7 @@ async def _parallelize_calls(
                         )
                         if retry_count >= MAX_VALIDATION_ATTEMPTS:
                             logger.error(
-                                f"Validation failed for {model_name} after {MAX_VALIDATION_ATTEMPTS} attempts: {e}"
+                                f"Validation failed for {model_name} after {retry_count} attempts. Original output: {e.failed_output}"
                             )
                             result = LLMOutput(
                                 model=model_name,
@@ -195,8 +195,8 @@ async def _parallelize_calls(
                         break
                     except Exception as e:
                         if not isinstance(e, LLMException):
-                            logger.warning(
-                                f"LLM call raised an exception that is not an LLMException: {e}"
+                            logger.error(
+                                f"LLM call raised an exception that is not an LLMException: {e}. Failure traceback:\n{traceback.format_exc()}"
                             )
                             llm_exception = LLMException(e)
                             llm_exception.__cause__ = e

docent/trace.py CHANGED Viewed

@@ -1,12 +1,15 @@
+import asyncio
 import atexit
 import contextvars
 import itertools
+import json
 import logging
 import os
 import sys
 import threading
 import uuid
 from collections import defaultdict
+from concurrent.futures import Future, ThreadPoolExecutor
 from contextlib import asynccontextmanager, contextmanager
 from contextvars import ContextVar, Token
 from datetime import datetime, timezone
@@ -132,6 +135,10 @@ class DocentTracer:
         self._transcript_group_states: dict[str, dict[str, Optional[str]]] = {}
         self._transcript_group_state_lock = threading.Lock()
         self._flush_lock = threading.Lock()
+        self._http_executor: Optional[ThreadPoolExecutor] = None
+        self._http_executor_lock = threading.Lock()
+        self._pending_http_futures: Set[Future[Any]] = set()
+        self._pending_http_lock = threading.Lock()
     def get_current_agent_run_id(self) -> Optional[str]:
         """
@@ -441,6 +448,12 @@ class DocentTracer:
         try:
             self.flush()
+            if self._http_executor:
+                self._http_executor.shutdown(wait=True)
+                self._http_executor = None
+            with self._pending_http_lock:
+                self._pending_http_futures.clear()
             if self._tracer_provider:
                 self._tracer_provider.shutdown()
                 self._tracer_provider = None
@@ -471,6 +484,7 @@ class DocentTracer:
                 if hasattr(processor, "force_flush"):
                     logger.debug(f"Flushing span processor {i}")
                     processor.force_flush(timeout_millis=50)
+            self._wait_for_http_requests()
             logger.debug("Span flush completed")
         except Exception as e:
             logger.error(f"Error during flush: {e}")
@@ -617,7 +631,66 @@ class DocentTracer:
         return headers
-    def _post_json(self, path: str, data: Dict[str, Any]) -> None:
+    def _get_http_executor(self) -> ThreadPoolExecutor:
+        with self._http_executor_lock:
+            if self._http_executor is None:
+                self._http_executor = ThreadPoolExecutor(
+                    max_workers=4, thread_name_prefix="docent-http"
+                )
+            return self._http_executor
+    def _should_run_http_in_background(self) -> bool:
+        try:
+            loop = asyncio.get_running_loop()
+        except RuntimeError:
+            return False
+        return loop.is_running()
+    def _on_http_future_done(self, future: Future[Any]) -> None:
+        with self._pending_http_lock:
+            self._pending_http_futures.discard(future)
+        try:
+            future.result()
+        except Exception as exc:  # pragma: no cover - defensive logging
+            logger.error(f"Background HTTP request failed: {exc}")
+    def _schedule_background_post(self, task: Callable[[], None]) -> None:
+        executor = self._get_http_executor()
+        future = executor.submit(task)
+        with self._pending_http_lock:
+            self._pending_http_futures.add(future)
+        future.add_done_callback(self._on_http_future_done)
+    def _wait_for_http_requests(self) -> None:
+        while True:
+            with self._pending_http_lock:
+                pending = list(self._pending_http_futures)
+            if not pending:
+                break
+            for future in pending:
+                try:
+                    future.result()
+                except Exception as exc:  # pragma: no cover - defensive logging
+                    logger.error(f"Background HTTP request failed: {exc}")
+    def _ensure_json_serializable_metadata(self, metadata: Dict[str, Any], context: str) -> None:
+        """
+        Validate that metadata can be serialized to JSON before sending it to the backend.
+        """
+        try:
+            json.dumps(metadata)
+        except (TypeError, ValueError) as exc:
+            raise TypeError(f"{context} metadata must be JSON serializable") from exc
+    def _post_json(
+        self, path: str, data: Dict[str, Any], *, allow_background: bool = False
+    ) -> None:
+        if allow_background and self._should_run_http_in_background():
+            self._schedule_background_post(lambda: self._post_json_sync(path, data))
+            return
+        self._post_json_sync(path, data)
+    def _post_json_sync(self, path: str, data: Dict[str, Any]) -> None:
         if not self._api_endpoint_base:
             raise RuntimeError("API endpoint base is not configured")
         url = f"{self._api_endpoint_base}{path}"
@@ -662,6 +735,8 @@ class DocentTracer:
         if self._disabled:
             return
+        self._ensure_json_serializable_metadata(metadata, "Agent run")
         collection_id = self.collection_id
         payload: Dict[str, Any] = {
             "collection_id": collection_id,
@@ -669,7 +744,7 @@ class DocentTracer:
             "metadata": metadata,
             "timestamp": datetime.now(timezone.utc).isoformat(),
         }
-        self._post_json("/v1/agent-run-metadata", payload)
+        self._post_json("/v1/agent-run-metadata", payload, allow_background=True)
     def send_transcript_metadata(
         self,
@@ -707,6 +782,7 @@ class DocentTracer:
         if transcript_group_id is not None:
             payload["transcript_group_id"] = transcript_group_id
         if metadata is not None:
+            self._ensure_json_serializable_metadata(metadata, "Transcript")
             payload["metadata"] = metadata
         self._post_json("/v1/transcript-metadata", payload)
@@ -925,6 +1001,7 @@ class DocentTracer:
         if final_parent_transcript_group_id is not None:
             payload["parent_transcript_group_id"] = final_parent_transcript_group_id
         if metadata is not None:
+            self._ensure_json_serializable_metadata(metadata, "Transcript group")
             payload["metadata"] = metadata
         self._post_json("/v1/transcript-group-metadata", payload)

{docent_python-0.1.25a0.dist-info → docent_python-0.1.26a0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: docent-python
-Version: 0.1.25a0
+Version: 0.1.26a0
 Summary: Docent SDK
 Project-URL: Homepage, https://github.com/TransluceAI/docent
 Project-URL: Issues, https://github.com/TransluceAI/docent/issues

{docent_python-0.1.25a0.dist-info → docent_python-0.1.26a0.dist-info}/RECORD RENAMED Viewed

@@ -1,14 +1,14 @@
 docent/__init__.py,sha256=fuhETwJPcesiB76Zxa64HBJxeaaTyRalIH-fs77TWsU,112
 docent/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-docent/trace.py,sha256=loJJDD3AX-rrP-QsZ8WkkFPxKd4u9wiiBG0gtxSgY0I,69743
+docent/trace.py,sha256=3Z6xy4ZsP5S1_xrN6luwSsHfZlQL94qLZazJ3v-fzxQ,72953
 docent/trace_temp.py,sha256=Z0lAPwVzXjFvxpiU-CuvfWIslq9Q4alNkZMoQ77Xudk,40711
 docent/_llm_util/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docent/_llm_util/llm_cache.py,sha256=nGrvfFikFbEnfmzZRvWvZ60gfVSTvW1iC8-ciCXwbAk,6430
-docent/_llm_util/llm_svc.py,sha256=PQ-96UDJrnPa9csTKL_JDO8jzOrLzysVBqUHywuij0w,18046
+docent/_llm_util/llm_svc.py,sha256=WbLx8F0BfToL0PUIUKNWVwjAoGPE3AUCbVJLBIWTeWA,18109
 docent/_llm_util/model_registry.py,sha256=8Y4VwrA2f2EX78cG1VBIBHVvT_p4qqBTdu9a9zJpfTo,3382
 docent/_llm_util/data_models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docent/_llm_util/data_models/exceptions.py,sha256=IW4BVMVp8r5TufNXyrhy3acgwJiQQQPQjB9VA4RVXw8,1489
-docent/_llm_util/data_models/llm_output.py,sha256=ZAIIcgfxMZtTft8bXTPAhUcXEO48GLG3epkul_4gQNQ,10239
+docent/_llm_util/data_models/llm_output.py,sha256=UCYewoXN72skigN_fm414TzQol1KxmVbQGwgGVROE_4,10602
 docent/_llm_util/providers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docent/_llm_util/providers/anthropic.py,sha256=-1oPd5FB4aFwKSmNvXzG8PVewjhgsogLRX1SCpnCxoA,18720
 docent/_llm_util/providers/common.py,sha256=dgcTuU4XkCKoAaM48UW8zMgRYUzj7TDBhvWqtnxBO7g,1166
@@ -53,7 +53,7 @@ docent/samples/tb_airline.json,sha256=eR2jFFRtOw06xqbEglh6-dPewjifOk-cuxJq67Dtu5
 docent/sdk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docent/sdk/agent_run_writer.py,sha256=0AWdxejoqZyuj9JSA39WlEwGcMSYTWNqnzIuluySY-M,11043
 docent/sdk/client.py,sha256=aB_ILmzzK9JAC2kobtnp50stfINpSfNh54siaDlMEKc,19880
-docent_python-0.1.25a0.dist-info/METADATA,sha256=kBFVQJ-HqomY9dG6wd3xCw9OyC5gRP7Gz3ZIQHpqq0c,1351
-docent_python-0.1.25a0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-docent_python-0.1.25a0.dist-info/licenses/LICENSE.md,sha256=QIMv2UiT6MppRasso4ymaA0w7ltkqmlL0HCt8CLD7Rc,580
-docent_python-0.1.25a0.dist-info/RECORD,,
+docent_python-0.1.26a0.dist-info/METADATA,sha256=TWwg2-VbK4CCWDDx36P4tnbExZw7ljYGoVMhWqfofZk,1351
+docent_python-0.1.26a0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+docent_python-0.1.26a0.dist-info/licenses/LICENSE.md,sha256=QIMv2UiT6MppRasso4ymaA0w7ltkqmlL0HCt8CLD7Rc,580
+docent_python-0.1.26a0.dist-info/RECORD,,

{docent_python-0.1.25a0.dist-info → docent_python-0.1.26a0.dist-info}/WHEEL RENAMED Viewed

File without changes

{docent_python-0.1.25a0.dist-info → docent_python-0.1.26a0.dist-info}/licenses/LICENSE.md RENAMED Viewed

File without changes

docent-python 0.1.25a0__py3-none-any.whl → 0.1.26a0__py3-none-any.whl

docent-python 0.1.25a0__py3-none-any.whl → 0.1.26a0__py3-none-any.whl