haiku.rag-slim 0.16.0-py3-none-any.whl → 0.24.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of haiku.rag-slim might be problematic.

Files changed (94)
  1. haiku/rag/app.py +430 -72
  2. haiku/rag/chunkers/__init__.py +31 -0
  3. haiku/rag/chunkers/base.py +31 -0
  4. haiku/rag/chunkers/docling_local.py +164 -0
  5. haiku/rag/chunkers/docling_serve.py +179 -0
  6. haiku/rag/cli.py +207 -24
  7. haiku/rag/cli_chat.py +489 -0
  8. haiku/rag/client.py +1251 -266
  9. haiku/rag/config/__init__.py +16 -10
  10. haiku/rag/config/loader.py +5 -44
  11. haiku/rag/config/models.py +126 -17
  12. haiku/rag/converters/__init__.py +31 -0
  13. haiku/rag/converters/base.py +63 -0
  14. haiku/rag/converters/docling_local.py +193 -0
  15. haiku/rag/converters/docling_serve.py +229 -0
  16. haiku/rag/converters/text_utils.py +237 -0
  17. haiku/rag/embeddings/__init__.py +123 -24
  18. haiku/rag/embeddings/voyageai.py +175 -20
  19. haiku/rag/graph/__init__.py +0 -11
  20. haiku/rag/graph/agui/__init__.py +8 -2
  21. haiku/rag/graph/agui/cli_renderer.py +1 -1
  22. haiku/rag/graph/agui/emitter.py +219 -31
  23. haiku/rag/graph/agui/server.py +20 -62
  24. haiku/rag/graph/agui/stream.py +1 -2
  25. haiku/rag/graph/research/__init__.py +5 -2
  26. haiku/rag/graph/research/dependencies.py +12 -126
  27. haiku/rag/graph/research/graph.py +390 -135
  28. haiku/rag/graph/research/models.py +91 -112
  29. haiku/rag/graph/research/prompts.py +99 -91
  30. haiku/rag/graph/research/state.py +35 -27
  31. haiku/rag/inspector/__init__.py +8 -0
  32. haiku/rag/inspector/app.py +259 -0
  33. haiku/rag/inspector/widgets/__init__.py +6 -0
  34. haiku/rag/inspector/widgets/chunk_list.py +100 -0
  35. haiku/rag/inspector/widgets/context_modal.py +89 -0
  36. haiku/rag/inspector/widgets/detail_view.py +130 -0
  37. haiku/rag/inspector/widgets/document_list.py +75 -0
  38. haiku/rag/inspector/widgets/info_modal.py +209 -0
  39. haiku/rag/inspector/widgets/search_modal.py +183 -0
  40. haiku/rag/inspector/widgets/visual_modal.py +126 -0
  41. haiku/rag/mcp.py +106 -102
  42. haiku/rag/monitor.py +33 -9
  43. haiku/rag/providers/__init__.py +5 -0
  44. haiku/rag/providers/docling_serve.py +108 -0
  45. haiku/rag/qa/__init__.py +12 -10
  46. haiku/rag/qa/agent.py +43 -61
  47. haiku/rag/qa/prompts.py +35 -57
  48. haiku/rag/reranking/__init__.py +9 -6
  49. haiku/rag/reranking/base.py +1 -1
  50. haiku/rag/reranking/cohere.py +5 -4
  51. haiku/rag/reranking/mxbai.py +5 -2
  52. haiku/rag/reranking/vllm.py +3 -4
  53. haiku/rag/reranking/zeroentropy.py +6 -5
  54. haiku/rag/store/__init__.py +2 -1
  55. haiku/rag/store/engine.py +242 -42
  56. haiku/rag/store/exceptions.py +4 -0
  57. haiku/rag/store/models/__init__.py +8 -2
  58. haiku/rag/store/models/chunk.py +190 -0
  59. haiku/rag/store/models/document.py +46 -0
  60. haiku/rag/store/repositories/chunk.py +141 -121
  61. haiku/rag/store/repositories/document.py +25 -84
  62. haiku/rag/store/repositories/settings.py +11 -14
  63. haiku/rag/store/upgrades/__init__.py +19 -3
  64. haiku/rag/store/upgrades/v0_10_1.py +1 -1
  65. haiku/rag/store/upgrades/v0_19_6.py +65 -0
  66. haiku/rag/store/upgrades/v0_20_0.py +68 -0
  67. haiku/rag/store/upgrades/v0_23_1.py +100 -0
  68. haiku/rag/store/upgrades/v0_9_3.py +3 -3
  69. haiku/rag/utils.py +371 -146
  70. {haiku_rag_slim-0.16.0.dist-info → haiku_rag_slim-0.24.0.dist-info}/METADATA +15 -12
  71. haiku_rag_slim-0.24.0.dist-info/RECORD +78 -0
  72. {haiku_rag_slim-0.16.0.dist-info → haiku_rag_slim-0.24.0.dist-info}/WHEEL +1 -1
  73. haiku/rag/chunker.py +0 -65
  74. haiku/rag/embeddings/base.py +0 -25
  75. haiku/rag/embeddings/ollama.py +0 -28
  76. haiku/rag/embeddings/openai.py +0 -26
  77. haiku/rag/embeddings/vllm.py +0 -29
  78. haiku/rag/graph/agui/events.py +0 -254
  79. haiku/rag/graph/common/__init__.py +0 -5
  80. haiku/rag/graph/common/models.py +0 -42
  81. haiku/rag/graph/common/nodes.py +0 -265
  82. haiku/rag/graph/common/prompts.py +0 -46
  83. haiku/rag/graph/common/utils.py +0 -44
  84. haiku/rag/graph/deep_qa/__init__.py +0 -1
  85. haiku/rag/graph/deep_qa/dependencies.py +0 -27
  86. haiku/rag/graph/deep_qa/graph.py +0 -243
  87. haiku/rag/graph/deep_qa/models.py +0 -20
  88. haiku/rag/graph/deep_qa/prompts.py +0 -59
  89. haiku/rag/graph/deep_qa/state.py +0 -56
  90. haiku/rag/graph/research/common.py +0 -87
  91. haiku/rag/reader.py +0 -135
  92. haiku_rag_slim-0.16.0.dist-info/RECORD +0 -71
  93. {haiku_rag_slim-0.16.0.dist-info → haiku_rag_slim-0.24.0.dist-info}/entry_points.txt +0 -0
  94. {haiku_rag_slim-0.16.0.dist-info → haiku_rag_slim-0.24.0.dist-info}/licenses/LICENSE +0 -0
--- a/haiku/rag/graph/agui/server.py
+++ b/haiku/rag/graph/agui/server.py
@@ -18,8 +18,7 @@ from starlette.responses import JSONResponse, StreamingResponse
 from starlette.routing import Route
 
 from haiku.rag.config.models import AGUIConfig
-from haiku.rag.graph.agui.emitter import AGUIEmitter
-from haiku.rag.graph.agui.events import AGUIEvent
+from haiku.rag.graph.agui.emitter import AGUIEmitter, AGUIEvent
 from haiku.rag.graph.agui.stream import stream_graph
 
 
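Downstream code that imported AGUIEvent from the removed haiku.rag.graph.agui.events module needs a one-line import change. A minimal before/after sketch based on this hunk:

    # Before (0.16.x): AGUIEvent lived in its own events module
    from haiku.rag.graph.agui.emitter import AGUIEmitter
    from haiku.rag.graph.agui.events import AGUIEvent

    # After (0.24.0): AGUIEvent is exported from the emitter module
    from haiku.rag.graph.agui.emitter import AGUIEmitter, AGUIEvent
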
@@ -151,23 +150,25 @@ def format_sse_event(event: AGUIEvent) -> str:
     return f"data: {event_json}\n\n"
 
 
-def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
-    """Create AG-UI server with both research and deep ask endpoints.
+def create_agui_server(  # pragma: no cover
+    config: "AppConfig", db_path: Path | None = None
+) -> Starlette:
+    """Create AG-UI server with research endpoint.
 
     Args:
-        config: Application config with research and qa settings
+        config: Application config with research settings
        db_path: Optional database path override
 
     Returns:
-        Starlette app with research and deep ask endpoints
+        Starlette app with research endpoint
     """
     from haiku.rag.client import HaikuRAG
-    from haiku.rag.graph.deep_qa.dependencies import DeepQAContext
-    from haiku.rag.graph.deep_qa.graph import build_deep_qa_graph
-    from haiku.rag.graph.deep_qa.state import DeepQADeps, DeepQAState
     from haiku.rag.graph.research.dependencies import ResearchContext
     from haiku.rag.graph.research.graph import build_research_graph
-    from haiku.rag.graph.research.state import ResearchDeps, ResearchState
+    from haiku.rag.graph.research.state import (
+        ResearchDeps,
+        ResearchState,
+    )
 
     # Store client reference for proper lifecycle management
     _client_cache: dict[str, HaikuRAG] = {}
@@ -190,7 +191,14 @@ def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
             if messages:
                 question = messages[0].get("content", "")
         context = ResearchContext(original_question=question)
-        return ResearchState.from_config(context=context, config=config)
+        max_iterations = input_state.get("max_iterations")
+        confidence_threshold = input_state.get("confidence_threshold")
+        return ResearchState.from_config(
+            context=context,
+            config=config,
+            max_iterations=max_iterations,
+            confidence_threshold=confidence_threshold,
+        )
 
     def research_deps_factory(input_config: dict[str, Any]) -> ResearchDeps:
         effective_db_path = (
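The rewritten state factory reads optional max_iterations and confidence_threshold overrides from the AG-UI input state. A hypothetical client sketch; the endpoint path appears in the routes hunk below, while the port, the exact wire schema, and any extra RunAgentInput fields are assumptions, not taken from this diff:

    import httpx

    payload = {
        "state": {
            "messages": [{"role": "user", "content": "What is haiku.rag?"}],
            "max_iterations": 3,          # optional per-run override
            "confidence_threshold": 0.8,  # optional per-run override
        },
        "config": {"db_path": "/tmp/haiku.rag.lancedb"},
    }

    with httpx.stream("POST", "http://localhost:8000/v1/research/stream", json=payload) as resp:
        for line in resp.iter_lines():
            if line.startswith("data: "):
                print(line[len("data: "):])  # one JSON-encoded AGUIEvent per SSE frame
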
@@ -200,29 +208,7 @@ def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
         )
         return ResearchDeps(client=get_client(effective_db_path))
 
-    # Deep ask graph factories
-    def deep_ask_graph_factory() -> Graph:
-        return build_deep_qa_graph(config)
-
-    def deep_ask_state_factory(input_state: dict[str, Any]) -> DeepQAState:
-        question = input_state.get("question", "")
-        if not question:
-            messages = input_state.get("messages", [])
-            if messages:
-                question = messages[0].get("content", "")
-        use_citations = input_state.get("use_citations", False)
-        context = DeepQAContext(original_question=question, use_citations=use_citations)
-        return DeepQAState.from_config(context=context, config=config)
-
-    def deep_ask_deps_factory(input_config: dict[str, Any]) -> DeepQADeps:
-        effective_db_path = (
-            db_path
-            or input_config.get("db_path")
-            or config.storage.data_dir / "haiku.rag.lancedb"
-        )
-        return DeepQADeps(client=get_client(effective_db_path))
-
-    # Create event stream functions for each graph type
+    # Create event stream function
     async def research_event_stream(
         input_data: RunAgentInput,
     ) -> AsyncIterator[str]:
@@ -235,18 +221,6 @@ def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
             event_data = format_sse_event(event)
             yield event_data
 
-    async def deep_ask_event_stream(
-        input_data: RunAgentInput,
-    ) -> AsyncIterator[str]:
-        """Generate SSE event stream from deep ask graph execution."""
-        graph = deep_ask_graph_factory()
-        initial_state = deep_ask_state_factory(input_data.state)
-        deps = deep_ask_deps_factory(input_data.config)
-
-        async for event in stream_graph(graph, initial_state, deps):
-            event_data = format_sse_event(event)
-            yield event_data
-
     # Endpoint handlers
     async def stream_research(request: Request) -> StreamingResponse:
         """Research graph streaming endpoint."""
@@ -263,21 +237,6 @@ def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
             },
         )
 
-    async def stream_deep_ask(request: Request) -> StreamingResponse:
-        """Deep ask graph streaming endpoint."""
-        body = await request.json()
-        input_data = RunAgentInput(**body)
-
-        return StreamingResponse(
-            deep_ask_event_stream(input_data),
-            media_type="text/event-stream",
-            headers={
-                "Cache-Control": "no-cache",
-                "Connection": "keep-alive",
-                "X-Accel-Buffering": "no",
-            },
-        )
-
     async def health_check(_: Request) -> JSONResponse:
         """Health check endpoint."""
         return JSONResponse({"status": "healthy"})
@@ -285,7 +244,6 @@ def create_agui_server(config: "AppConfig", db_path: Path | None = None) -> Starlette:
     # Define routes
     routes = [
         Route("/v1/research/stream", stream_research, methods=["POST"]),
-        Route("/v1/deep-ask/stream", stream_deep_ask, methods=["POST"]),
         Route("/health", health_check, methods=["GET"]),
     ]
 
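After this change only the research stream and the health check remain; the /v1/deep-ask/stream route is removed along with the whole deep_qa package. A minimal serving sketch, assuming uvicorn is available; the config-loader import below is illustrative only and not an API confirmed by this diff:

    import uvicorn

    from haiku.rag.config import load_config  # illustrative; the actual loader API is not shown here
    from haiku.rag.graph.agui.server import create_agui_server

    config = load_config()            # an AppConfig carrying the research settings
    app = create_agui_server(config)  # db_path falls back to config.storage.data_dir
    uvicorn.run(app, host="127.0.0.1", port=8000)
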
--- a/haiku/rag/graph/agui/stream.py
+++ b/haiku/rag/graph/agui/stream.py
@@ -8,8 +8,7 @@ from typing import Protocol, TypeVar
 from pydantic import BaseModel
 from pydantic_graph.beta import Graph
 
-from haiku.rag.graph.agui.emitter import AGUIEmitter
-from haiku.rag.graph.agui.events import AGUIEvent
+from haiku.rag.graph.agui.emitter import AGUIEmitter, AGUIEvent
 
 StateT = TypeVar("StateT", bound=BaseModel)
 ResultT = TypeVar("ResultT")
--- a/haiku/rag/graph/research/__init__.py
+++ b/haiku/rag/graph/research/__init__.py
@@ -1,3 +1,6 @@
-from haiku.rag.graph.common.models import SearchAnswer
 from haiku.rag.graph.research.dependencies import ResearchContext, ResearchDependencies
-from haiku.rag.graph.research.models import EvaluationResult, ResearchReport
+from haiku.rag.graph.research.models import (
+    EvaluationResult,
+    ResearchReport,
+    SearchAnswer,
+)
--- a/haiku/rag/graph/research/dependencies.py
+++ b/haiku/rag/graph/research/dependencies.py
@@ -1,14 +1,12 @@
-from collections.abc import Iterable
+from typing import TYPE_CHECKING, Any
 
-from pydantic import BaseModel, Field, PrivateAttr
+from pydantic import BaseModel, Field
 
 from haiku.rag.client import HaikuRAG
-from haiku.rag.graph.common.models import SearchAnswer
-from haiku.rag.graph.research.models import (
-    GapRecord,
-    InsightAnalysis,
-    InsightRecord,
-)
+from haiku.rag.store.models import SearchResult
+
+if TYPE_CHECKING:
+    from haiku.rag.graph.research.models import SearchAnswer
 
 
 class ResearchContext(BaseModel):
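Moving the SearchAnswer import under TYPE_CHECKING, with the runtime field typed list[Any] and the method parameter quoted in the hunk below, is the standard way to break a circular import while keeping annotations checkable. The general pattern, as a generic sketch with hypothetical module names:

    from typing import TYPE_CHECKING, Any

    if TYPE_CHECKING:
        # Evaluated only by type checkers, never at runtime,
        # so it cannot participate in an import cycle.
        from mypackage.models import Answer  # hypothetical module

    class Context:
        def __init__(self) -> None:
            self.answers: list[Any] = []  # runtime type stays loose

        def add(self, answer: "Answer") -> None:  # string annotation is resolved lazily
            self.answers.append(answer)
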
@@ -18,124 +16,14 @@ class ResearchContext(BaseModel):
     sub_questions: list[str] = Field(
         default_factory=list, description="Decomposed sub-questions"
     )
-    qa_responses: list[SearchAnswer] = Field(
+    qa_responses: list[Any] = Field(
         default_factory=list, description="Structured QA pairs used during research"
     )
-    insights: list[InsightRecord] = Field(
-        default_factory=list, description="Key insights discovered"
-    )
-    gaps: list[GapRecord] = Field(
-        default_factory=list, description="Identified information gaps"
-    )
-
-    # Private dict indexes for O(1) lookups
-    _insights_by_id: dict[str, InsightRecord] = PrivateAttr(default_factory=dict)
-    _gaps_by_id: dict[str, GapRecord] = PrivateAttr(default_factory=dict)
-
-    def model_post_init(self, __context: object) -> None:
-        """Build indexes after initialization."""
-        self._insights_by_id = {ins.id: ins for ins in self.insights}
-        self._gaps_by_id = {gap.id: gap for gap in self.gaps}
 
-    def add_qa_response(self, qa: SearchAnswer) -> None:
-        """Add a structured QA response (minimal context already included)."""
+    def add_qa_response(self, qa: "SearchAnswer") -> None:
+        """Add a structured QA response."""
         self.qa_responses.append(qa)
 
-    def upsert_insights(self, records: Iterable[InsightRecord]) -> list[InsightRecord]:
-        """Merge one or more insights into the shared context with deduplication."""
-        merged: list[InsightRecord] = []
-
-        for record in records:
-            candidate = InsightRecord.model_validate(record)
-            existing = self._insights_by_id.get(candidate.id)
-
-            if existing:
-                # Update existing insight
-                existing.summary = candidate.summary
-                existing.status = candidate.status
-                if candidate.notes:
-                    existing.notes = candidate.notes
-                existing.supporting_sources = _merge_unique(
-                    existing.supporting_sources, candidate.supporting_sources
-                )
-                existing.originating_questions = _merge_unique(
-                    existing.originating_questions, candidate.originating_questions
-                )
-                merged.append(existing)
-            else:
-                # Add new insight
-                new_insight = candidate.model_copy(deep=True)
-                self.insights.append(new_insight)
-                self._insights_by_id[new_insight.id] = new_insight
-                merged.append(new_insight)
-
-        return merged
-
-    def upsert_gaps(self, records: Iterable[GapRecord]) -> list[GapRecord]:
-        """Merge one or more gap records into the shared context with deduplication."""
-        merged: list[GapRecord] = []
-
-        for record in records:
-            candidate = GapRecord.model_validate(record)
-            existing = self._gaps_by_id.get(candidate.id)
-
-            if existing:
-                # Update existing gap
-                existing.description = candidate.description
-                existing.severity = candidate.severity
-                existing.blocking = candidate.blocking
-                existing.resolved = candidate.resolved
-                if candidate.notes:
-                    existing.notes = candidate.notes
-                existing.supporting_sources = _merge_unique(
-                    existing.supporting_sources, candidate.supporting_sources
-                )
-                existing.resolved_by = _merge_unique(
-                    existing.resolved_by, candidate.resolved_by
-                )
-                merged.append(existing)
-            else:
-                # Add new gap
-                new_gap = candidate.model_copy(deep=True)
-                self.gaps.append(new_gap)
-                self._gaps_by_id[new_gap.id] = new_gap
-                merged.append(new_gap)
-
-        return merged
-
-    def mark_gap_resolved(
-        self, identifier: str, resolved_by: Iterable[str] | None = None
-    ) -> GapRecord | None:
-        """Mark a gap as resolved by identifier."""
-        gap = self._gaps_by_id.get(identifier)
-        if gap is None:
-            return None
-
-        gap.resolved = True
-        gap.blocking = False
-        if resolved_by:
-            gap.resolved_by = _merge_unique(gap.resolved_by, list(resolved_by))
-        return gap
-
-    def integrate_analysis(self, analysis: InsightAnalysis) -> None:
-        """Apply an analysis result to the shared context."""
-        merged_insights: list[InsightRecord] = []
-        if analysis.highlights:
-            merged_insights = self.upsert_insights(analysis.highlights)
-            analysis.highlights = merged_insights
-        if analysis.gap_assessments:
-            merged_gaps = self.upsert_gaps(analysis.gap_assessments)
-            analysis.gap_assessments = merged_gaps
-        if analysis.resolved_gaps:
-            resolved_by_list = (
-                [ins.id for ins in merged_insights] if merged_insights else None
-            )
-            for resolved in analysis.resolved_gaps:
-                self.mark_gap_resolved(resolved, resolved_by=resolved_by_list)
-        for question in analysis.new_questions:
-            if question not in self.sub_questions:
-                self.sub_questions.append(question)
-
 
 class ResearchDependencies(BaseModel):
     """Dependencies for research agents with multi-agent context."""
@@ -144,8 +32,6 @@
 
     client: HaikuRAG = Field(description="RAG client for document operations")
     context: ResearchContext = Field(description="Shared research context")
-
-
-def _merge_unique(existing: list[str], incoming: Iterable[str]) -> list[str]:
-    """Merge two iterables preserving order while removing duplicates."""
-    return [k for k in dict.fromkeys([*existing, *incoming]) if k]
+    search_results: list[SearchResult] = Field(
+        default_factory=list, description="Search results for citation resolution"
+    )
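The deleted _merge_unique helper is a compact order-preserving dedup. Since dict keys keep insertion order in Python 3.7+, the idiom is worth noting on its own; this sketch reuses the body of the removed code, renamed to stand alone:

    def merge_unique(existing: list[str], incoming: list[str]) -> list[str]:
        # dict.fromkeys keeps first-seen order and drops duplicates;
        # the comprehension also filters out empty strings.
        return [k for k in dict.fromkeys([*existing, *incoming]) if k]

    assert merge_unique(["a", "b"], ["b", "", "c"]) == ["a", "b", "c"]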