vedana_backoffice-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,368 @@
+ import asyncio
+ import logging
+ import os
+ import traceback
+ from datetime import datetime
+ from typing import Any, Dict, Iterable, Tuple
+ from uuid import UUID, uuid4
+
+ import orjson as json
+ import reflex as rx
+ import requests
+ from datapipe.compute import Catalog, run_pipeline
+ from jims_core.llms.llm_provider import env_settings as llm_settings
+ from jims_core.thread.thread_controller import ThreadController
+ from jims_core.util import uuid7
+ from vedana_core.settings import settings as core_settings
+ from vedana_etl.app import app as etl_app
+ from vedana_etl.pipeline import get_data_model_pipeline
+
+ from vedana_backoffice.states.common import MemLogger, get_vedana_app
+ from vedana_backoffice.states.jims import ThreadViewState
+
+
+ class ChatState(rx.State):
+     """Minimal chatbot with per-answer technical details."""
+
+     input_text: str = ""
+     is_running: bool = False
+     messages: list[dict[str, Any]] = []
+     chat_thread_id: str = ""
+     data_model_text: str = ""
+     is_refreshing_dm: bool = False
+     provider: str = "openai"  # default llm provider
+     model: str = core_settings.model
+     _default_models: tuple[str, ...] = (
+         "gpt-5.1-chat-latest",
+         "gpt-5.1",
+         "gpt-5-chat-latest",
+         "gpt-5",
+         "gpt-5-mini",
+         "gpt-5-nano",
+         "gpt-4.1",
+         "gpt-4.1-mini",
+         "gpt-4.1-nano",
+         "gpt-4o",
+         "gpt-4o-mini",
+         "o4-mini",
+     )
+     custom_openrouter_key: str = ""
+     default_openrouter_key_present: bool = bool(os.environ.get("OPENROUTER_API_KEY"))  # used to decide whether to require api_key input
+     openai_models: list[str] = sorted({*_default_models, core_settings.model})
+     openrouter_models: list[str] = []
+     available_models: list[str] = sorted({*_default_models, core_settings.model})
+     # accept only explicit truthy values; a plain bool(os.environ.get(...)) would treat "0"/"false" as enabled
+     enable_dm_filtering: bool = os.environ.get("ENABLE_DM_FILTERING", "").lower() in ("1", "true", "yes")
+
+     async def mount(self) -> None:
+         self.fetch_openrouter_models()
+         self._sync_available_models()
+
+     def set_input(self, value: str) -> None:
+         self.input_text = value
+
+     def set_model(self, value: str) -> None:
+         if value in self.available_models:
+             self.model = value
+
+     def set_custom_openrouter_key(self, value: str) -> None:
+         self.custom_openrouter_key = value  # TODO: validate the key format?
+
+     def set_enable_dm_filtering(self, value: bool) -> None:
+         self.enable_dm_filtering = value
+
+     def set_provider(self, value: str) -> None:
+         self.provider = value
+         self._sync_available_models()
+
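+     # Assumed shape of an OpenRouter /models entry (not validated by this code):
+     #   {"id": "...", "architecture": {"input_modalities": ["text", ...],
+     #    "output_modalities": ["text", ...]}, "supported_parameters": ["tools", ...]}
+     # Only models that do text-in/text-out chat AND support tool calls are kept.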
+     def _filter_chat_capable(self, models: Iterable[dict]) -> list[str]:
+         result: list[str] = []
+         for m in models:
+             model_id = str(m.get("id", "")).strip()
+             if not model_id:
+                 continue
+
+             has_chat = False
+             architecture = m.get("architecture", {})
+             if architecture:
+                 if "text" in architecture.get("input_modalities", []) and "text" in architecture.get(
+                     "output_modalities", []
+                 ):
+                     has_chat = True
+
+             has_tools = False  # only accept models with tool calls
+             if "tools" in m.get("supported_parameters", []):
+                 has_tools = True
+
+             if has_chat and has_tools:
+                 result.append(model_id)
+
+         return result
+
+     def fetch_openrouter_models(self) -> None:
+         try:
+             resp = requests.get(
+                 f"{llm_settings.openrouter_api_base_url}/models",
+                 # headers={"Authorization": f"Bearer {openrouter_api_key}"},  # actually works without a token as well
+                 timeout=10,
+             )
+             resp.raise_for_status()
+             payload = resp.json()
+             models = payload.get("data", [])
+             parsed = self._filter_chat_capable(models)
+         except Exception as exc:  # pragma: no cover - best effort
+             logging.warning(f"Failed to fetch OpenRouter models: {exc}")
+             parsed = []
+         self.openrouter_models = sorted(parsed)
+
+     def _sync_available_models(self) -> None:
+         """
+         Recompute available_models based on the selected provider, and realign
+         the selected model if it is no longer valid.
+         """
+
+         if self.provider == "openrouter":
+             models = self.openrouter_models
+             if not models:
+                 self.provider = "openai"
+                 models = self.openai_models
+         else:
+             models = self.openai_models
+
+         self.available_models = list(models)
+
+         if self.model not in self.available_models and self.available_models:
+             self.model = self.available_models[0]
+
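+     # toggle_details_by_id copies the message dict and writes it back instead of
+     # mutating it in place, so the list reassignment is reliably picked up for re-render.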
+     def toggle_details_by_id(self, message_id: str) -> None:
+         for idx, m in enumerate(self.messages):
+             if str(m.get("id")) == str(message_id):
+                 msg = dict(m)
+                 msg["show_details"] = not bool(msg.get("show_details"))
+                 self.messages[idx] = msg
+                 break
+
+     def reset_session(self) -> None:
+         """Clear current chat history and start a fresh session (new thread on next send)."""
+         self.messages = []
+         self.input_text = ""
+         self.chat_thread_id = ""
+
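+     # the rx.var computed properties below are re-evaluated as state changes,
+     # so the running cost total stays current as assistant answers arrive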
+     @rx.var
+     def total_conversation_cost(self) -> float:
+         """Calculate the total cost by summing requests_cost over all assistant messages."""
+         total = 0.0
+         for msg in self.messages:
+             if msg.get("is_assistant") and msg.get("model_stats"):
+                 model_stats = msg.get("model_stats", {})
+                 if isinstance(model_stats, dict):
+                     # model_stats can be {model_name: {requests_cost: value, ...}}
+                     for stats in model_stats.values():
+                         if isinstance(stats, dict):
+                             cost = stats.get("requests_cost")
+                             if cost is not None:
+                                 try:
+                                     total += float(cost)
+                                 except (ValueError, TypeError):
+                                     pass
+         return total
+
+     @rx.var
+     def total_conversation_cost_str(self) -> str:
+         """Formatted string representation of the total conversation cost."""
+         cost = self.total_conversation_cost
+         if cost > 0:
+             return f"${cost:.6f}"
+         return ""
+
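+     # technical details are pre-flattened into plain display strings (vts_str,
+     # cypher_str, models_str) so the frontend can render them directly;
+     # orjson.dumps returns bytes, hence the .decode() below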
+     def _append_message(
+         self,
+         role: str,
+         content: str,
+         technical_info: dict[str, Any] | None = None,
+         debug_logs: str | None = None,
+     ) -> None:
+         message: dict[str, Any] = {
+             "id": str(uuid4()),
+             "role": role,
+             "content": content,
+             "created_at": datetime.now().strftime("%Y-%m-%d %H:%M"),
+             "is_assistant": role == "assistant",
+             "has_tech": False,
+             "show_details": False,
+             "tags": [],
+             "comments": [],
+         }
+
+         if technical_info:
+             vts_list = [str(x) for x in technical_info.get("vts_queries") or []]
+             cypher_list = [str(x) for x in technical_info.get("cypher_queries") or []]
+             models_raw = technical_info.get("model_stats", {})
+             model_pairs: list[tuple[str, str]] = []
+             if isinstance(models_raw, dict):
+                 for mk, mv in models_raw.items():
+                     try:
+                         model_pairs.append((str(mk), json.dumps(mv).decode()))
+                     except Exception:
+                         model_pairs.append((str(mk), str(mv)))
+             models_list = [f"{k}: {v}" for k, v in model_pairs]
+
+             message["vts_str"] = "\n".join(vts_list)
+             message["cypher_str"] = "\n".join(cypher_list)
+             message["models_str"] = "\n".join(models_list)
+             message["has_vts"] = bool(vts_list)
+             message["has_cypher"] = bool(cypher_list)
+             message["has_models"] = bool(models_list)
+             message["has_tech"] = bool(vts_list or cypher_list or models_list)
+             message["model_stats"] = models_raw
+
+         logs = (debug_logs or "").replace("\r\n", "\n").rstrip()
+         message["logs_str"] = logs
+         message["has_logs"] = bool(logs)
+
+         self.messages.append(message)
+
+     async def _ensure_thread(self) -> str:
+         vedana_app = await get_vedana_app()
+         try:
+             existing = await ThreadController.from_thread_id(vedana_app.sessionmaker, UUID(self.chat_thread_id))
+         except Exception:
+             existing = None
+
+         if existing is None:
+             thread_id = uuid7()
+             ctl = await ThreadController.new_thread(
+                 vedana_app.sessionmaker,
+                 contact_id=f"reflex:{thread_id}",
+                 thread_id=thread_id,
+                 thread_config={"interface": "reflex"},
+             )
+             return str(ctl.thread.thread_id)
+
+         return self.chat_thread_id
+
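+     # one request/response turn: store the user message, run the RAG pipeline
+     # with a per-turn MemLogger attached, then collect the assistant answer and
+     # technical_info from the emitted events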
+     async def _run_message(self, thread_id: str, user_text: str) -> Tuple[str, Dict[str, Any], str]:
+         vedana_app = await get_vedana_app()
+         try:
+             tid = UUID(thread_id)
+         except Exception:
+             tid = uuid7()
+
+         ctl = await ThreadController.from_thread_id(vedana_app.sessionmaker, tid)
+         if ctl is None:
+             thr_id = uuid7()
+             ctl = await ThreadController.new_thread(
+                 vedana_app.sessionmaker,
+                 contact_id=f"reflex:{thr_id}",
+                 thread_id=thr_id,
+                 thread_config={"interface": "reflex"},
+             )
+
+         mem_logger = MemLogger("rag_debug", level=logging.DEBUG)
+
+         await ctl.store_user_message(uuid7(), user_text)
+
+         pipeline = vedana_app.pipeline
+         pipeline.logger = mem_logger
+         pipeline.model = f"{self.provider}/{self.model}"
+         pipeline.enable_filtering = self.enable_dm_filtering
+
+         ctx = await ctl.make_context()
+
+         # override the model api_key if a custom one is provided
+         if self.custom_openrouter_key and self.provider == "openrouter":
+             ctx.llm.model_api_key = self.custom_openrouter_key
+         # the embeddings model is not customisable in chat; it is configured at the project level
+
+         events = await ctl.run_pipeline_with_context(pipeline, ctx)
+
+         answer: str = ""
+         tech: dict[str, Any] = {}
+         for ev in events:
+             if ev.event_type == "comm.assistant_message":
+                 answer = str(ev.event_data.get("content", ""))
+             elif ev.event_type == "rag.query_processed":
+                 tech = dict(ev.event_data.get("technical_info", {}))
+
+         logs = mem_logger.get_logs()
+         return answer, tech, logs
+
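+     # note: the whole handler body runs inside `async with self`, so this
+     # client's state stays locked for the duration of the pipeline run;
+     # acceptable here since a session sends one message at a time (is_running)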
+     # mypy raises error: "EventNamespace" not callable [operator], though the
+     # event definition follows the reflex docs
+     @rx.event(background=True)  # type: ignore[operator]
+     async def send_background(self, user_text: str):
+         """Runs in the background (non-blocking) after a send() submission."""
+         # need the state context to modify state safely
+         async with self:
+             try:
+                 thread_id = await self._ensure_thread()
+                 answer, tech, logs = await self._run_message(thread_id, user_text)
+                 # update the shared session thread id
+                 self.chat_thread_id = thread_id
+             except Exception as e:
+                 answer, tech, logs = (f"Error: {e}", {}, traceback.format_exc())
+
+             self._append_message("assistant", answer, technical_info=tech, debug_logs=logs)
+             self.is_running = False
+
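+     # two-step submit: yield once so the user message and running indicator
+     # render immediately, then hand the slow work to a background event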
+     def send(self):
+         """Form submit / button click."""
+         if self.is_running:
+             return
+
+         user_text = (self.input_text or "").strip()
+         if not user_text:
+             return
+
+         self._append_message("user", user_text)
+         self.input_text = ""
+         self.is_running = True
+         yield  # trigger UI update
+
+         yield ChatState.send_background(user_text)
+
+     def open_jims_thread(self):
+         """Open the JIMS page and preselect the current chat thread."""
+         if not (self.chat_thread_id or "").strip():
+             return
+
+         # first set the selection on the JIMS state, then navigate to /jims
+         yield ThreadViewState.select_thread(thread_id=self.chat_thread_id)  # type: ignore[operator]
+         yield rx.redirect("/jims")  # type: ignore[operator]
+
+     @rx.event(background=True)  # type: ignore[operator]
+     async def load_data_model_text(self):
+         async with self:
+             va = await get_vedana_app()
+             try:
+                 self.data_model_text = await va.data_model.to_text_descr()
+             except Exception:
+                 self.data_model_text = "(failed to load data model text)"
+
+             self.is_refreshing_dm = False  # make the update button available
+         yield
+
+     def reload_data_model(self):
+         """Connects the button to a background task; yields first so the loading animation triggers properly."""
+         if self.is_refreshing_dm:
+             return
+         self.is_refreshing_dm = True
+         yield
+         yield ChatState.reload_data_model_background()
+
+     @rx.event(background=True)  # type: ignore[operator]
+     async def reload_data_model_background(self):
+         """Reload the data model by running all data_model_steps from the pipeline."""
+         try:
+             await asyncio.to_thread(run_pipeline, etl_app.ds, Catalog({}), get_data_model_pipeline())
+             async with self:
+                 va = await get_vedana_app()
+                 self.data_model_text = await va.data_model.to_text_descr()
+             yield rx.toast.success("Data model reloaded")
+         except Exception as e:
+             async with self:
+                 error_msg = str(e)
+                 self.data_model_text = f"(error reloading data model: {error_msg})"
+             yield rx.toast.error(f"Failed to reload data model\n{error_msg}")
+         finally:
+             async with self:
+                 self.is_refreshing_dm = False
+             yield
@@ -0,0 +1,66 @@
+ import io
+ import logging
+ import os
+
+ import reflex as rx
+ import requests
+ from vedana_core.app import VedanaApp, make_vedana_app
+
+ vedana_app: VedanaApp | None = None
+
+ EVAL_ENABLED = bool(os.environ.get("GRIST_TEST_SET_DOC_ID"))
+
+
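+ # lazily creates the VedanaApp once per process; all states share the instance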
+ async def get_vedana_app():
+     global vedana_app
+     if vedana_app is None:
+         vedana_app = await make_vedana_app()
+     return vedana_app
+
+
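+ # MemLogger writes records to an in-memory StringIO buffer (read back via
+ # get_logs) and, through its parent logger, still propagates them to the
+ # normal logging tree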
+ class MemLogger(logging.Logger):
+     """Logger that captures logs to a string buffer for debugging purposes."""
+
+     def __init__(self, name: str, level: int = 0) -> None:
+         super().__init__(name, level)
+         self.parent = logging.getLogger(__name__)
+         self._buf = io.StringIO()
+         handler = logging.StreamHandler(self._buf)
+         handler.setFormatter(logging.Formatter("%(asctime)s - %(name)s - %(levelname)s - %(message)s"))
+         self.addHandler(handler)
+
+     def get_logs(self) -> str:
+         return self._buf.getvalue()
+
+     def clear(self) -> None:
+         self._buf.truncate(0)
+         self._buf.seek(0)
+
+
+ class AppVersionState(rx.State):
+     version: str = f"`{os.environ.get('VERSION', 'unspecified_version')}`"  # md-formatted
+     eval_enabled: bool = EVAL_ENABLED
+
+
+ class TelegramBotState(rx.State):
+     """State for Telegram bot information."""
+
+     bot_username: str = ""
+     bot_url: str = ""
+     has_bot: bool = False
+
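+     # Telegram's getMe returns {"ok": true, "result": {"username": ..., ...}}
+     # on success; anything else is treated as "no bot configured"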
+     def load_bot_info(self) -> None:
+         token = os.environ.get("TELEGRAM_BOT_TOKEN")
+         if not token:
+             return
+
+         try:
+             resp = requests.get(f"https://api.telegram.org/bot{token}/getMe", timeout=10)
+             if resp.status_code == 200:
+                 payload = resp.json()
+                 if payload["ok"]:
+                     self.bot_username = payload["result"]["username"]
+                     self.bot_url = f"https://t.me/{self.bot_username}"
+                     self.has_bot = True
+         except Exception as e:
+             logging.warning(f"Failed to load Telegram bot info: {e}")