ai-pipeline-core 0.3.3-py3-none-any.whl → 0.4.0-py3-none-any.whl

This diff compares the contents of two publicly released versions of the package, as they appear in their respective public registries, and is provided for informational purposes only.
Files changed (96)
  1. ai_pipeline_core/__init__.py +70 -144
  2. ai_pipeline_core/deployment/__init__.py +6 -18
  3. ai_pipeline_core/deployment/base.py +392 -212
  4. ai_pipeline_core/deployment/contract.py +6 -10
  5. ai_pipeline_core/{utils → deployment}/deploy.py +50 -69
  6. ai_pipeline_core/deployment/helpers.py +16 -17
  7. ai_pipeline_core/{progress.py → deployment/progress.py} +23 -24
  8. ai_pipeline_core/{utils/remote_deployment.py → deployment/remote.py} +11 -14
  9. ai_pipeline_core/docs_generator/__init__.py +54 -0
  10. ai_pipeline_core/docs_generator/__main__.py +5 -0
  11. ai_pipeline_core/docs_generator/cli.py +196 -0
  12. ai_pipeline_core/docs_generator/extractor.py +324 -0
  13. ai_pipeline_core/docs_generator/guide_builder.py +644 -0
  14. ai_pipeline_core/docs_generator/trimmer.py +35 -0
  15. ai_pipeline_core/docs_generator/validator.py +114 -0
  16. ai_pipeline_core/document_store/__init__.py +13 -0
  17. ai_pipeline_core/document_store/_summary.py +9 -0
  18. ai_pipeline_core/document_store/_summary_worker.py +170 -0
  19. ai_pipeline_core/document_store/clickhouse.py +492 -0
  20. ai_pipeline_core/document_store/factory.py +38 -0
  21. ai_pipeline_core/document_store/local.py +312 -0
  22. ai_pipeline_core/document_store/memory.py +85 -0
  23. ai_pipeline_core/document_store/protocol.py +68 -0
  24. ai_pipeline_core/documents/__init__.py +12 -14
  25. ai_pipeline_core/documents/_context_vars.py +85 -0
  26. ai_pipeline_core/documents/_hashing.py +52 -0
  27. ai_pipeline_core/documents/attachment.py +85 -0
  28. ai_pipeline_core/documents/context.py +128 -0
  29. ai_pipeline_core/documents/document.py +318 -1434
  30. ai_pipeline_core/documents/mime_type.py +37 -82
  31. ai_pipeline_core/documents/utils.py +4 -12
  32. ai_pipeline_core/exceptions.py +10 -62
  33. ai_pipeline_core/images/__init__.py +32 -85
  34. ai_pipeline_core/images/_processing.py +5 -11
  35. ai_pipeline_core/llm/__init__.py +6 -4
  36. ai_pipeline_core/llm/ai_messages.py +106 -81
  37. ai_pipeline_core/llm/client.py +267 -158
  38. ai_pipeline_core/llm/model_options.py +12 -84
  39. ai_pipeline_core/llm/model_response.py +53 -99
  40. ai_pipeline_core/llm/model_types.py +8 -23
  41. ai_pipeline_core/logging/__init__.py +2 -7
  42. ai_pipeline_core/logging/logging.yml +1 -1
  43. ai_pipeline_core/logging/logging_config.py +27 -37
  44. ai_pipeline_core/logging/logging_mixin.py +15 -41
  45. ai_pipeline_core/observability/__init__.py +32 -0
  46. ai_pipeline_core/observability/_debug/__init__.py +30 -0
  47. ai_pipeline_core/observability/_debug/_auto_summary.py +94 -0
  48. ai_pipeline_core/{debug/config.py → observability/_debug/_config.py} +11 -7
  49. ai_pipeline_core/{debug/content.py → observability/_debug/_content.py} +134 -75
  50. ai_pipeline_core/{debug/processor.py → observability/_debug/_processor.py} +16 -17
  51. ai_pipeline_core/{debug/summary.py → observability/_debug/_summary.py} +113 -37
  52. ai_pipeline_core/observability/_debug/_types.py +75 -0
  53. ai_pipeline_core/{debug/writer.py → observability/_debug/_writer.py} +126 -196
  54. ai_pipeline_core/observability/_document_tracking.py +146 -0
  55. ai_pipeline_core/observability/_initialization.py +194 -0
  56. ai_pipeline_core/observability/_logging_bridge.py +57 -0
  57. ai_pipeline_core/observability/_summary.py +81 -0
  58. ai_pipeline_core/observability/_tracking/__init__.py +6 -0
  59. ai_pipeline_core/observability/_tracking/_client.py +178 -0
  60. ai_pipeline_core/observability/_tracking/_internal.py +28 -0
  61. ai_pipeline_core/observability/_tracking/_models.py +138 -0
  62. ai_pipeline_core/observability/_tracking/_processor.py +158 -0
  63. ai_pipeline_core/observability/_tracking/_service.py +311 -0
  64. ai_pipeline_core/observability/_tracking/_writer.py +229 -0
  65. ai_pipeline_core/{tracing.py → observability/tracing.py} +139 -335
  66. ai_pipeline_core/pipeline/__init__.py +10 -0
  67. ai_pipeline_core/pipeline/decorators.py +915 -0
  68. ai_pipeline_core/pipeline/options.py +16 -0
  69. ai_pipeline_core/prompt_manager.py +16 -102
  70. ai_pipeline_core/settings.py +26 -31
  71. ai_pipeline_core/testing.py +9 -0
  72. ai_pipeline_core-0.4.0.dist-info/METADATA +807 -0
  73. ai_pipeline_core-0.4.0.dist-info/RECORD +76 -0
  74. ai_pipeline_core/debug/__init__.py +0 -26
  75. ai_pipeline_core/documents/document_list.py +0 -420
  76. ai_pipeline_core/documents/flow_document.py +0 -112
  77. ai_pipeline_core/documents/task_document.py +0 -117
  78. ai_pipeline_core/documents/temporary_document.py +0 -74
  79. ai_pipeline_core/flow/__init__.py +0 -9
  80. ai_pipeline_core/flow/config.py +0 -494
  81. ai_pipeline_core/flow/options.py +0 -75
  82. ai_pipeline_core/pipeline.py +0 -718
  83. ai_pipeline_core/prefect.py +0 -63
  84. ai_pipeline_core/prompt_builder/__init__.py +0 -5
  85. ai_pipeline_core/prompt_builder/documents_prompt.jinja2 +0 -23
  86. ai_pipeline_core/prompt_builder/global_cache.py +0 -78
  87. ai_pipeline_core/prompt_builder/new_core_documents_prompt.jinja2 +0 -6
  88. ai_pipeline_core/prompt_builder/prompt_builder.py +0 -253
  89. ai_pipeline_core/prompt_builder/system_prompt.jinja2 +0 -41
  90. ai_pipeline_core/storage/__init__.py +0 -8
  91. ai_pipeline_core/storage/storage.py +0 -628
  92. ai_pipeline_core/utils/__init__.py +0 -8
  93. ai_pipeline_core-0.3.3.dist-info/METADATA +0 -569
  94. ai_pipeline_core-0.3.3.dist-info/RECORD +0 -57
  95. {ai_pipeline_core-0.3.3.dist-info → ai_pipeline_core-0.4.0.dist-info}/WHEEL +0 -0
  96. {ai_pipeline_core-0.3.3.dist-info → ai_pipeline_core-0.4.0.dist-info}/licenses/LICENSE +0 -0
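
Most of the churn above is a reorganization rather than new surface area: deployment helpers move out of `utils/` into a `deployment/` package, tracing and debug move under `observability/`, and the monolithic `pipeline.py` becomes a `pipeline/` package. A minimal migration sketch, inferred only from the rename entries above (symbol-level re-exports are not visible in this diff):

```python
# Import-path moves in 0.4.0, inferred from the rename entries in the
# file list above. Module paths only; consult each module's __all__ for
# the symbols it actually exports.

# 0.3.3:
#   from ai_pipeline_core import progress, tracing
#   from ai_pipeline_core.utils import deploy, remote_deployment

# 0.4.0:
from ai_pipeline_core.deployment import deploy, progress, remote
from ai_pipeline_core.observability import tracing
```

The hunks below cover the logging mixins, the new `observability` package, and its trace-debug configuration.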
--- a/ai_pipeline_core/logging/logging_mixin.py
+++ b/ai_pipeline_core/logging/logging_mixin.py
@@ -2,9 +2,10 @@
 
 import contextlib
 import time
+from collections.abc import Generator
 from contextlib import contextmanager
 from functools import cached_property
-from typing import Any, Dict, Generator, Optional
+from typing import Any
 
 from prefect import get_run_logger
 from prefect.context import FlowRunContext, TaskRunContext
@@ -23,7 +24,7 @@ class LoggerMixin:
     - Internal routing when outside flow/task context
     """
 
-    _logger_name: Optional[str] = None
+    _logger_name: str | None = None
 
     @cached_property
     def logger(self):
@@ -32,7 +33,8 @@ class LoggerMixin:
             return logger
         return get_logger(self._logger_name or self.__class__.__module__)
 
-    def _get_run_logger(self):
+    @staticmethod
+    def _get_run_logger():
         """Attempt to get Prefect run logger.
 
         Returns:
@@ -56,15 +58,15 @@
         """Log warning message with optional context."""
         self.logger.warning(message, extra=kwargs)
 
-    def log_error(self, message: str, exc_info: bool = False, **kwargs: Any) -> None:
+    def log_error(self, message: str, *, exc_info: bool = False, **kwargs: Any) -> None:
         """Log error message with optional exception info."""
         self.logger.error(message, exc_info=exc_info, extra=kwargs)
 
-    def log_critical(self, message: str, exc_info: bool = False, **kwargs: Any) -> None:
+    def log_critical(self, message: str, *, exc_info: bool = False, **kwargs: Any) -> None:
         """Log critical message with optional exception info."""
        self.logger.critical(message, exc_info=exc_info, extra=kwargs)
 
-    def log_with_context(self, level: str, message: str, context: Dict[str, Any]) -> None:
+    def log_with_context(self, level: str, message: str, context: dict[str, Any]) -> None:
         """Log message with structured context.
 
         Args:
@@ -72,12 +74,6 @@
             message: Log message
             context: Additional context as dictionary
 
-        Example:
-            self.log_with_context("info", "Processing document", {
-                "document_id": doc.id,
-                "document_size": doc.size,
-                "document_type": doc.type
-            })
         """
         log_method = getattr(self.logger, level.lower(), self.logger.info)
@@ -98,11 +94,6 @@ class StructuredLoggerMixin(LoggerMixin):
             event: Event name
             **kwargs: Event attributes
 
-        Example:
-            self.log_event("document_processed",
-                document_id=doc.id,
-                duration_ms=processing_time,
-                status="success")
         """
         self.logger.info(event, extra={"event": event, "structured": True, **kwargs})
 
@@ -115,9 +106,6 @@
             unit: Unit of measurement
             **tags: Additional tags
 
-        Example:
-            self.log_metric("processing_time", 1.23, "seconds",
-                document_type="pdf", model="gpt-5.1")
         """
         self.logger.info(
             f"Metric: {metric_name}",
@@ -138,9 +126,6 @@
             duration_ms: Duration in milliseconds
             **attributes: Additional attributes
 
-        Example:
-            self.log_span("llm_generation", 1234.5,
-                model="gpt-5.1", tokens=500)
         """
         self.logger.info(
             f"Span: {operation}",
@@ -160,9 +145,6 @@
             operation: Operation name
             **context: Additional context
 
-        Example:
-            with self.log_operation("document_processing", doc_id=doc.id):
-                process_document(doc)
         """
         start_time = time.perf_counter()
 
@@ -171,14 +153,12 @@
         try:
             yield
             duration_ms = (time.perf_counter() - start_time) * 1000
-            self.log_info(
-                f"Completed {operation}", duration_ms=duration_ms, status="success", **context
-            )
+            self.log_info(f"Completed {operation}", duration_ms=duration_ms, status="success", **context)
         except Exception as e:
             # Intentionally broad: Context manager must catch all exceptions to log them
             duration_ms = (time.perf_counter() - start_time) * 1000
             self.log_error(
-                f"Failed {operation}: {str(e)}",
+                f"Failed {operation}: {e!s}",
                 exc_info=True,
                 duration_ms=duration_ms,
                 status="failure",
@@ -190,31 +170,25 @@
 class PrefectLoggerMixin(StructuredLoggerMixin):
     """Enhanced mixin specifically for Prefect flows and tasks."""
 
-    def log_flow_start(self, flow_name: str, parameters: Dict[str, Any]) -> None:
+    def log_flow_start(self, flow_name: str, parameters: dict[str, Any]) -> None:
         """Log flow start with parameters."""
         self.log_event("flow_started", flow_name=flow_name, parameters=parameters)
 
     def log_flow_end(self, flow_name: str, status: str, duration_ms: float) -> None:
         """Log flow completion."""
-        self.log_event(
-            "flow_completed", flow_name=flow_name, status=status, duration_ms=duration_ms
-        )
+        self.log_event("flow_completed", flow_name=flow_name, status=status, duration_ms=duration_ms)
 
-    def log_task_start(self, task_name: str, inputs: Dict[str, Any]) -> None:
+    def log_task_start(self, task_name: str, inputs: dict[str, Any]) -> None:
         """Log task start with inputs."""
         self.log_event("task_started", task_name=task_name, inputs=inputs)
 
     def log_task_end(self, task_name: str, status: str, duration_ms: float) -> None:
         """Log task completion."""
-        self.log_event(
-            "task_completed", task_name=task_name, status=status, duration_ms=duration_ms
-        )
+        self.log_event("task_completed", task_name=task_name, status=status, duration_ms=duration_ms)
 
     def log_retry(self, operation: str, attempt: int, max_attempts: int, error: str) -> None:
         """Log retry attempt."""
-        self.log_warning(
-            f"Retrying {operation}", attempt=attempt, max_attempts=max_attempts, error=error
-        )
+        self.log_warning(f"Retrying {operation}", attempt=attempt, max_attempts=max_attempts, error=error)
 
     def log_checkpoint(self, checkpoint_name: str, **data: Any) -> None:
         """Log a checkpoint in processing."""
--- /dev/null
+++ b/ai_pipeline_core/observability/__init__.py
@@ -0,0 +1,32 @@
+"""Observability system for AI pipelines.
+
+Contains debug tracing, ClickHouse-based tracking, and initialization utilities.
+"""
+
+from ai_pipeline_core.observability._debug import (
+    ArtifactStore,
+    ContentRef,
+    ContentWriter,
+    LocalDebugSpanProcessor,
+    LocalTraceWriter,
+    SpanInfo,
+    TraceDebugConfig,
+    TraceState,
+    WriteJob,
+    generate_summary,
+)
+from ai_pipeline_core.observability._debug._content import reconstruct_span_content
+
+__all__ = [
+    "ArtifactStore",
+    "ContentRef",
+    "ContentWriter",
+    "LocalDebugSpanProcessor",
+    "LocalTraceWriter",
+    "SpanInfo",
+    "TraceDebugConfig",
+    "TraceState",
+    "WriteJob",
+    "generate_summary",
+    "reconstruct_span_content",
+]
--- /dev/null
+++ b/ai_pipeline_core/observability/_debug/__init__.py
@@ -0,0 +1,30 @@
+"""Local trace debugging system for AI pipelines.
+
+This module provides filesystem-based trace debugging that saves all spans
+with their inputs/outputs for LLM-assisted debugging. Includes static
+summary generation and LLM-powered auto-summary capabilities.
+
+Enabled automatically in CLI mode (``run_cli``), writing to ``<working_dir>/.trace``.
+Disable with ``--no-trace``.
+"""
+
+from ._config import TraceDebugConfig
+from ._content import ArtifactStore, ContentRef, ContentWriter, reconstruct_span_content
+from ._processor import LocalDebugSpanProcessor
+from ._summary import generate_summary
+from ._types import SpanInfo, TraceState, WriteJob
+from ._writer import LocalTraceWriter
+
+__all__ = [
+    "ArtifactStore",
+    "ContentRef",
+    "ContentWriter",
+    "LocalDebugSpanProcessor",
+    "LocalTraceWriter",
+    "SpanInfo",
+    "TraceDebugConfig",
+    "TraceState",
+    "WriteJob",
+    "generate_summary",
+    "reconstruct_span_content",
+]
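
Both `__init__` modules export the same eleven names, so downstream code can stay on the public package and avoid the underscore-prefixed subpackage. A minimal sketch:

```python
# Import the trace-debug surface from the public observability package;
# it re-exports everything _debug/__init__.py lists in __all__.
from ai_pipeline_core.observability import (
    LocalDebugSpanProcessor,
    LocalTraceWriter,
    TraceDebugConfig,
    generate_summary,
    reconstruct_span_content,
)
```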
--- /dev/null
+++ b/ai_pipeline_core/observability/_debug/_auto_summary.py
@@ -0,0 +1,94 @@
+"""LLM-powered auto-summary generation for trace debugging.
+
+Separated from _summary.py to avoid circular imports: this module depends on
+ai_pipeline_core.llm, which cannot be imported during the initial package load
+chain that includes _debug/__init__.py.
+"""
+
+from pydantic import BaseModel, ConfigDict
+
+from ai_pipeline_core.llm import generate_structured
+from ai_pipeline_core.llm.ai_messages import AIMessages
+from ai_pipeline_core.llm.model_options import ModelOptions
+
+from ._types import TraceState
+
+
+class AutoTraceSummary(BaseModel):
+    """LLM-generated trace analysis."""
+
+    model_config = ConfigDict(frozen=True)
+
+    overview: str
+    outcome: str
+    error_analysis: str
+    bottlenecks: tuple[str, ...] = ()
+    cost_assessment: str
+    recommendations: tuple[str, ...] = ()
+
+
+async def generate_auto_summary(
+    trace: TraceState,  # noqa: ARG001
+    static_summary: str,
+    model: str,
+) -> str | None:
+    """Generate LLM-powered auto-summary of the trace.
+
+    Args:
+        trace: Completed trace state with all span data.
+        static_summary: Pre-generated static summary text used as LLM input context.
+        model: LLM model name for summary generation.
+
+    Returns:
+        Formatted markdown auto-summary string, or None if generation fails.
+    """
+    messages = AIMessages()
+    messages.append(static_summary)
+
+    options = ModelOptions(
+        system_prompt=(
+            "You are analyzing an AI pipeline execution trace. "
+            "Provide concise, actionable analysis based on the execution data. "
+            "Focus on cost efficiency, performance bottlenecks, and errors."
+        ),
+    )
+
+    result = await generate_structured(
+        model=model,
+        response_format=AutoTraceSummary,
+        messages=messages,
+        options=options,
+        purpose="trace_auto_summary",
+    )
+
+    if not result or not result.parsed:
+        return None
+
+    summary = result.parsed
+    lines = [
+        "# Auto-Summary (LLM-Generated)",
+        "",
+        f"**Overview:** {summary.overview}",
+        "",
+        f"**Outcome:** {summary.outcome}",
+        "",
+    ]
+
+    if summary.error_analysis:
+        lines.append(f"**Error Analysis:** {summary.error_analysis}")
+        lines.append("")
+
+    if summary.bottlenecks:
+        lines.append("**Bottlenecks:**")
+        lines.extend(f"- {b}" for b in summary.bottlenecks)
+        lines.append("")
+
+    lines.append(f"**Cost Assessment:** {summary.cost_assessment}")
+    lines.append("")
+
+    if summary.recommendations:
+        lines.append("**Recommendations:**")
+        lines.extend(f"- {r}" for r in summary.recommendations)
+        lines.append("")
+
+    return "\n".join(lines)
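
A hedged sketch of driving this function directly; the helper name is hypothetical, and it assumes you already hold a completed `TraceState` plus the static summary text the writer produced (the normal path is the automatic invocation after trace completion when auto-summary is enabled):

```python
from ai_pipeline_core.observability import TraceState
from ai_pipeline_core.observability._debug._auto_summary import generate_auto_summary


async def append_auto_summary(trace: TraceState, static_summary: str) -> str:
    # trace is accepted but currently unused (noqa: ARG001 in the source);
    # the LLM sees only the static summary text as context.
    markdown = await generate_auto_summary(
        trace=trace,
        static_summary=static_summary,
        model="gemini-3-flash",  # the TraceDebugConfig.auto_summary_model default
    )
    # None signals that structured generation failed; fall back to the static text.
    return markdown if markdown is not None else static_summary
```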
--- a/ai_pipeline_core/observability/_debug/_config.py
+++ b/ai_pipeline_core/observability/_debug/_config.py
@@ -9,7 +9,7 @@ class TraceDebugConfig(BaseModel):
     """Configuration for local trace debugging.
 
     Controls how traces are written to the local filesystem for debugging.
-    Enable by setting TRACE_DEBUG_PATH environment variable.
+    Enabled automatically in CLI mode, writing to ``<working_dir>/.trace``.
     """
 
     model_config = ConfigDict(frozen=True)
@@ -47,12 +47,6 @@
         description="Merge Prefect wrapper spans with inner traced function spans",
     )
 
-    # Events (Issue #12)
-    events_file_mode: str = Field(
-        default="errors_only",
-        description="When to write events.yaml: 'all', 'errors_only', 'none'",
-    )
-
     # Indexes (Issue #1)
     include_llm_index: bool = Field(
         default=True,
@@ -89,3 +83,13 @@
 
     # Summary
     generate_summary: bool = Field(default=True, description="Generate _summary.md")
+
+    # Auto-summary (LLM-powered)
+    auto_summary_enabled: bool = Field(
+        default=False,
+        description="Generate LLM-powered auto-summary after trace completion",
+    )
+    auto_summary_model: str = Field(
+        default="gemini-3-flash",
+        description="Model to use for auto-summary generation",
+    )
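
Auto-summary is opt-in: `auto_summary_enabled` defaults to False. A minimal sketch of enabling it when constructing the config directly; in CLI mode the config is normally built for you:

```python
from ai_pipeline_core.observability import TraceDebugConfig

# Frozen pydantic model, so all fields are set at construction time.
config = TraceDebugConfig(
    generate_summary=True,                # static _summary.md (default True)
    auto_summary_enabled=True,            # LLM auto-summary (default False)
    auto_summary_model="gemini-3-flash",  # the field's documented default
)
```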