PyPI - mfs-server - Versions diffs - 0.4.0__py3-none-any.whl - Mend

mfs-server 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (110) hide show

mfs_server/__init__.py +0 -0
mfs_server/api/__init__.py +0 -0
mfs_server/api/app.py +645 -0
mfs_server/api/models.py +224 -0
mfs_server/common/__init__.py +0 -0
mfs_server/common/accel.py +125 -0
mfs_server/common/converter.py +60 -0
mfs_server/common/embedding.py +132 -0
mfs_server/common/embeddings/__init__.py +85 -0
mfs_server/common/embeddings/gemini.py +79 -0
mfs_server/common/embeddings/local.py +79 -0
mfs_server/common/embeddings/ollama.py +47 -0
mfs_server/common/embeddings/onnx.py +196 -0
mfs_server/common/embeddings/openai.py +85 -0
mfs_server/common/embeddings/utils.py +33 -0
mfs_server/common/embeddings/voyage.py +69 -0
mfs_server/common/llm/__init__.py +77 -0
mfs_server/common/llm/anthropic.py +72 -0
mfs_server/common/llm/gemini.py +62 -0
mfs_server/common/llm/openai.py +64 -0
mfs_server/common/retrieval.py +125 -0
mfs_server/common/summary.py +93 -0
mfs_server/common/vlm.py +91 -0
mfs_server/config.py +530 -0
mfs_server/connectors/__init__.py +0 -0
mfs_server/connectors/base.py +575 -0
mfs_server/connectors/bigquery/__init__.py +4 -0
mfs_server/connectors/bigquery/plugin.py +239 -0
mfs_server/connectors/discord/__init__.py +4 -0
mfs_server/connectors/discord/plugin.py +255 -0
mfs_server/connectors/feishu/__init__.py +4 -0
mfs_server/connectors/feishu/auth_login.py +132 -0
mfs_server/connectors/feishu/oauth.py +207 -0
mfs_server/connectors/feishu/plugin.py +659 -0
mfs_server/connectors/file/__init__.py +4 -0
mfs_server/connectors/file/plugin.py +589 -0
mfs_server/connectors/gdrive/__init__.py +4 -0
mfs_server/connectors/gdrive/plugin.py +251 -0
mfs_server/connectors/github/__init__.py +4 -0
mfs_server/connectors/github/plugin.py +327 -0
mfs_server/connectors/gmail/__init__.py +4 -0
mfs_server/connectors/gmail/plugin.py +214 -0
mfs_server/connectors/hubspot/__init__.py +4 -0
mfs_server/connectors/hubspot/plugin.py +181 -0
mfs_server/connectors/jira/__init__.py +4 -0
mfs_server/connectors/jira/plugin.py +210 -0
mfs_server/connectors/linear/__init__.py +4 -0
mfs_server/connectors/linear/plugin.py +196 -0
mfs_server/connectors/mongo/__init__.py +4 -0
mfs_server/connectors/mongo/plugin.py +217 -0
mfs_server/connectors/mysql/__init__.py +4 -0
mfs_server/connectors/mysql/plugin.py +276 -0
mfs_server/connectors/notion/__init__.py +4 -0
mfs_server/connectors/notion/plugin.py +239 -0
mfs_server/connectors/postgres/__init__.py +4 -0
mfs_server/connectors/postgres/plugin.py +303 -0
mfs_server/connectors/registry.py +56 -0
mfs_server/connectors/s3/__init__.py +4 -0
mfs_server/connectors/s3/plugin.py +155 -0
mfs_server/connectors/slack/__init__.py +4 -0
mfs_server/connectors/slack/plugin.py +229 -0
mfs_server/connectors/snowflake/__init__.py +4 -0
mfs_server/connectors/snowflake/plugin.py +356 -0
mfs_server/connectors/web/__init__.py +4 -0
mfs_server/connectors/web/plugin.py +239 -0
mfs_server/connectors/zendesk/__init__.py +4 -0
mfs_server/connectors/zendesk/plugin.py +200 -0
mfs_server/engine/__init__.py +0 -0
mfs_server/engine/adapters.py +135 -0
mfs_server/engine/engine.py +2984 -0
mfs_server/engine/job_lane/__init__.py +318 -0
mfs_server/engine/job_lane/queue.py +53 -0
mfs_server/engine/job_lane/tree.py +105 -0
mfs_server/engine/job_lane/worker.py +116 -0
mfs_server/engine/job_watcher.py +120 -0
mfs_server/engine/pipeline.py +409 -0
mfs_server/engine/producers/__init__.py +79 -0
mfs_server/engine/producers/base.py +195 -0
mfs_server/engine/producers/image.py +52 -0
mfs_server/engine/producers/message_stream.py +132 -0
mfs_server/engine/producers/record_collection.py +125 -0
mfs_server/engine/producers/render.py +156 -0
mfs_server/engine/producers/table_schema.py +70 -0
mfs_server/engine/producers/text.py +140 -0
mfs_server/engine/state.py +79 -0
mfs_server/processors/__init__.py +0 -0
mfs_server/processors/text.py +75 -0
mfs_server/server/__init__.py +0 -0
mfs_server/server/__main__.py +155 -0
mfs_server/server/connector_schemas.py +436 -0
mfs_server/server/connector_wizard.py +802 -0
mfs_server/server/setup_wizard.py +682 -0
mfs_server/server/wizard_ui.py +223 -0
mfs_server/storage/__init__.py +0 -0
mfs_server/storage/artifact_cache.py +79 -0
mfs_server/storage/file_state.py +103 -0
mfs_server/storage/ids.py +64 -0
mfs_server/storage/metadata/__init__.py +44 -0
mfs_server/storage/metadata/base.py +234 -0
mfs_server/storage/metadata/postgres.py +70 -0
mfs_server/storage/metadata/sqlite.py +72 -0
mfs_server/storage/milvus.py +468 -0
mfs_server/storage/transformation_cache/__init__.py +45 -0
mfs_server/storage/transformation_cache/base.py +137 -0
mfs_server/storage/transformation_cache/postgres.py +86 -0
mfs_server/storage/transformation_cache/sqlite.py +80 -0
mfs_server-0.4.0.dist-info/METADATA +159 -0
mfs_server-0.4.0.dist-info/RECORD +110 -0
mfs_server-0.4.0.dist-info/WHEEL +4 -0
mfs_server-0.4.0.dist-info/entry_points.txt +2 -0

mfs_server/__init__.py ADDED Viewed

File without changes

mfs_server/api/__init__.py ADDED Viewed

File without changes

mfs_server/api/app.py ADDED Viewed

@@ -0,0 +1,645 @@
+"""FastAPI /v1 control plane. Thin HTTP wrappers over Engine.
+Typed request/response models (api/models.py) make the generated OpenAPI rich enough
+for the multi-language SDKs. `add` indexes inline by default (returns job_id when done)
+or enqueues for the standalone worker when process=false.
+"""
+from __future__ import annotations
+import asyncio
+from contextlib import asynccontextmanager
+from typing import Literal
+from fastapi import FastAPI, HTTPException, Request
+from fastapi.exceptions import RequestValidationError
+from fastapi.openapi.utils import get_openapi
+from fastapi.responses import JSONResponse
+from starlette.datastructures import Headers
+from starlette.exceptions import HTTPException as StarletteHTTPException
+from starlette.requests import ClientDisconnect
+from ..config import ServerConfig, load_server_config
+from ..engine.engine import Engine
+from .models import (
+    AddRequest,
+    AddResponse,
+    CancelResponse,
+    CatMeta,
+    CatResponse,
+    EstimateResponse,
+    ErrorResponse,
+    GrepResponse,
+    JobResponse,
+    LsResponse,
+    ManifestRequest,
+    ManifestResponse,
+    ProbeRequest,
+    ProbeResponse,
+    RemoveResponse,
+    SearchResponse,
+    ServerInfo,
+    StatusResponse,
+)
+# Canonical error codes -> suggested next actions. The endpoints
+# raise HTTPException with the canonical code as `detail` for these cases; the handler
+# below turns that into the stable {code, detail, suggestions} envelope SDKs switch on.
+_CODE_SUGGESTIONS = {
+    "object_too_large_for_cat": ["head", "cat --range", "export"],
+    "is_directory": ["ls", "tree"],
+    "range_unsupported": ["cat --meta", "export"],
+    "density_unsupported": ["head", "cat --range"],
+    "tail_unsupported": ["head", "cat --range"],
+    "locator_not_found": ["re-search; the record may have changed"],
+    "since_unsupported": ["drop --since"],
+    "sync_already_running": ["mfs job list", "mfs job cancel JOB_ID"],
+    "connector_removing": ["wait for removal to finish, then retry"],
+    "remove_requires_connector_root": [
+        "pass the registered connector root from `mfs connector list` or `mfs connector inspect`"
+    ],
+    "connector_unhealthy": ["check credentials/connectivity"],
+    "embedding_auth_failed": ["fix the embedding provider API key, then `mfs add` again"],
+    "embedding_quota_exceeded": [
+        "top up the embedding provider quota/billing, then `mfs add` again"
+    ],
+    "field_missing": [
+        "fix the connector `[[objects]]` text_fields — a configured field is absent from the records"
+    ],
+    "not_found": ["check the URI"],
+    "not_available": ["the connector may require an optional dependency; install its extra"],
+    "top_k_too_large": [
+        "lower --top-k: it exceeds the vector store's result limit (hybrid mode over-fetches, so its effective limit is higher than top_k)"
+    ],
+    "embedding_dim_mismatch": [
+        "the embedding dimension doesn't match this collection's vectors (the collection name encodes its dim)",
+        "re-run `mfs-server setup --section embedding` to set the correct dim, or re-index into a fresh collection",
+    ],
+    "validation_error": ["fix request shape"],
+}
+# HTTP status -> code when `detail` isn't already a canonical code (human strings).
+_STATUS_CODE = {
+    400: "bad_request",
+    404: "not_found",
+    405: "method_not_allowed",
+    409: "conflict",
+    422: "validation_error",
+    499: "client_closed_request",
+    501: "not_available",
+    502: "connector_unhealthy",
+}
+# Error statuses advertised on every operation outside /healthz in the generated
+# OpenAPI schema (status string -> response description). The "401" entry is only
+# emitted when an auth token is configured.
+_OPENAPI_ERROR_RESPONSES = {
+    "400": "Bad Request",
+    "401": "Unauthorized",
+    "404": "Not Found",
+    "405": "Method Not Allowed",
+    "422": "Validation Error",
+    "500": "Internal Server Error",
+}
+# Path-item keys that denote HTTP operations; any other key under a path is skipped
+# when the schema is post-processed.
+_OPENAPI_METHODS = {"get", "post", "put", "patch", "delete", "options", "head"}
+def _error_response_ref(description: str) -> dict:
+    return {
+        "description": description,
+        "content": {"application/json": {"schema": {"$ref": "#/components/schemas/ErrorResponse"}}},
+    }
+def _install_openapi_contract(app: FastAPI, cfg: ServerConfig) -> None:
+    """Keep generated OpenAPI aligned with auth middleware and error handlers.
+    Replaces `app.openapi` with a generator that post-processes FastAPI's schema: it
+    registers the ErrorResponse component, declares bearer auth when `cfg.auth_token`
+    is set, and attaches the shared error responses to every operation except those
+    under /healthz. The finished schema is cached on `app.openapi_schema`."""
+    def custom_openapi() -> dict:
+        # Build once; later calls return the cached schema.
+        if app.openapi_schema:
+            return app.openapi_schema
+        schema = get_openapi(
+            title=app.title,
+            version=app.version,
+            description=app.description,
+            routes=app.routes,
+        )
+        components = schema.setdefault("components", {})
+        schemas = components.setdefault("schemas", {})
+        # Publish the error envelope model so the per-operation $refs below resolve.
+        schemas["ErrorResponse"] = ErrorResponse.model_json_schema(
+            ref_template="#/components/schemas/{model}"
+        )
+        auth_enabled = bool(cfg.auth_token)
+        if auth_enabled:
+            # Declare the bearer scheme and make it the document-wide default.
+            components.setdefault("securitySchemes", {})["BearerAuth"] = {
+                "type": "http",
+                "scheme": "bearer",
+                "bearerFormat": "opaque",
+            }
+            schema["security"] = [{"BearerAuth": []}]
+        for path, path_item in schema.get("paths", {}).items():
+            for method, operation in path_item.items():
+                # Only HTTP-operation keys are rewritten; other path-item keys are left alone.
+                if method not in _OPENAPI_METHODS:
+                    continue
+                if auth_enabled:
+                    # /healthz is documented as unauthenticated (empty security list).
+                    operation["security"] = [] if path == "/healthz" else [{"BearerAuth": []}]
+                # /healthz gets none of the shared error responses.
+                if path == "/healthz":
+                    continue
+                responses = operation.setdefault("responses", {})
+                for status, description in _OPENAPI_ERROR_RESPONSES.items():
+                    # 401 is only documented when a token is actually required.
+                    if status == "401" and not auth_enabled:
+                        continue
+                    # Overwrites any response FastAPI generated for this status (e.g. 422).
+                    responses[status] = _error_response_ref(description)
+        # Drop FastAPI's default validation-error schemas; the 422 responses written above
+        # point at ErrorResponse instead.
+        schemas.pop("HTTPValidationError", None)
+        schemas.pop("ValidationError", None)
+        app.openapi_schema = schema
+        return app.openapi_schema
+    app.openapi = custom_openapi
+def _auth_failure(headers: Headers, expected_token: str) -> tuple[int, dict] | None:
+    values = headers.getlist("authorization")
+    if len(values) > 1:
+        return (
+            400,
+            {
+                "code": "bad_request",
+                "detail": "duplicate Authorization header",
+                "suggestions": ["send exactly one Authorization: Bearer <token> header"],
+            },
+        )
+    if len(values) != 1:
+        return _unauthorized()
+    scheme, sep, token = values[0].partition(" ")
+    if sep != " " or scheme.lower() != "bearer" or token != expected_token:
+        return _unauthorized()
+    return None
+def _unauthorized() -> tuple[int, dict]:
+    return (
+        401,
+        {
+            "code": "unauthorized",
+            "detail": "missing or invalid bearer token",
+            "suggestions": ["set a profile token (Authorization: Bearer <token>)"],
+        },
+    )
+def _reject_unknown_query_params(request: Request, allowed: set[str]) -> None:
+    unknown = sorted({key for key, _ in request.query_params.multi_items()} - allowed)
+    if unknown:
+        joined = ", ".join(unknown)
+        raise HTTPException(422, f"unknown query parameter(s): {joined}")
+def create_app(cfg: ServerConfig | None = None, *, preload_local_models: bool = False) -> FastAPI:
+    cfg = cfg or load_server_config()
+    @asynccontextmanager
+    async def lifespan(app: FastAPI):
+        # Startup: build and start the Engine, then expose it to handlers via app.state.
+        eng = Engine(cfg)
+        await eng.startup(preload_local_models=preload_local_models)
+        app.state.engine = eng
+        # AIO (sqlite/single-binary): there is no separate worker process, so an enqueued
+        # (--no-process) job would sit 'queued' forever. Drain it with one in-process worker.
+        # CS (postgres) deployments run a dedicated `mfs-server worker`; skip there unless
+        # explicitly turned on, so API replicas don't also do indexing work.
+        # NOTE(review): as written the worker starts only when in_process_jobrunner is set
+        # AND the metadata backend is sqlite, so the flag alone never enables it on another
+        # backend — confirm whether the comment above or the condition is the intent.
+        worker_task = None
+        if cfg.server.in_process_jobrunner and eng.meta.backend == "sqlite":
+            worker_task = asyncio.create_task(eng.run_worker_forever(concurrency=1))
+        try:
+            yield
+        finally:
+            # Shutdown: stop the in-process worker (if one was started) before the engine.
+            if worker_task is not None:
+                worker_task.cancel()
+                try:
+                    await worker_task
+                except (asyncio.CancelledError, Exception):  # noqa: BLE001
+                    # Best-effort teardown: the cancellation, or any error the worker task
+                    # ended with, is deliberately ignored so eng.shutdown() still runs.
+                    pass
+            await eng.shutdown()
+    app = FastAPI(
+        title="MFS",
+        version="0.4.0",
+        lifespan=lifespan,
+        description="Multi-source File-like Search — HTTP /v1 control plane.",
+    )
+    _install_openapi_contract(app, cfg)
+    if cfg.auth_token:
+        @app.middleware("http")
+        async def _auth(request: Request, call_next):
+            """Bearer-token gate: when auth_token is configured,
+            every request — loopback included — must carry Authorization: Bearer <token>.
+            /healthz is exempt so k8s/compose liveness probes don't need the token (it
+            returns no data) — see deployments/."""
+            if request.url.path == "/healthz":
+                return await call_next(request)
+            if failure := _auth_failure(request.headers, cfg.auth_token):
+                status_code, content = failure
+                return JSONResponse(status_code=status_code, content=content)
+            return await call_next(request)
+    @app.exception_handler(StarletteHTTPException)
+    async def _http_exc(_request: Request, exc: StarletteHTTPException) -> JSONResponse:
+        """Wrap HTTPException into the {code, detail, suggestions} envelope.
+        When `detail` is already a canonical code, surface it as `code`; otherwise derive
+        `code` from the HTTP status and keep the human string as `detail`."""
+        detail = exc.detail if isinstance(exc.detail, str) else "error"
+        code = detail if detail in _CODE_SUGGESTIONS else _STATUS_CODE.get(exc.status_code, "error")
+        return JSONResponse(
+            status_code=exc.status_code,
+            content={
+                "code": code,
+                "detail": detail,
+                "suggestions": _CODE_SUGGESTIONS.get(code, []),
+            },
+            headers=getattr(exc, "headers", None),
+        )
+    @app.exception_handler(RequestValidationError)
+    async def _val_exc(_request: Request, exc: RequestValidationError) -> JSONResponse:
+        # Build the detail from only each error's location + message — deliberately DROP
+        # pydantic's `input`/`url`/`ctx` fields. `input` echoes the submitted value (which
+        # for a config body can be a live secret) and `url` carries the server source path;
+        # `str(exc)` would leak both. Keep `detail` a plain string so the envelope shape is
+        # unchanged for SDK consumers.
+        parts = []
+        for err in exc.errors():
+            loc = ".".join(str(p) for p in err.get("loc", ()) if p != "body")
+            msg = err.get("msg", "invalid")
+            parts.append(f"{loc}: {msg}" if loc else msg)
+        return JSONResponse(
+            status_code=422,
+            content={
+                "code": "validation_error",
+                "detail": "; ".join(parts) or "validation error",
+                "suggestions": ["fix request shape"],
+            },
+        )
+    @app.exception_handler(NotImplementedError)
+    async def _not_impl_exc(_request: Request, exc: NotImplementedError) -> JSONResponse:
+        """A requested connector scheme has no registered plugin — usually because its
+        optional extra isn't installed (registry.load_builtin skips connectors whose
+        import fails). Return a clean 501 envelope instead of a 500 + traceback, with an
+        actionable hint to install the connector's extra."""
+        detail = str(exc) or "not implemented"
+        # message shape is "no plugin for <scheme>": surface an install hint for that extra.
+        # The extra name usually equals the URI scheme, but a few differ because the SDK is
+        # shared/renamed: postgres's extra is `pg` (asyncpg), and gdrive/gmail share `google`
+        # (google-api-python-client). Map those so the hint names a command that exists
+        # (`uv sync --extra postgres` would fail — the real extra is `pg`).
+        _SCHEME_TO_EXTRA = {"postgres": "pg", "gdrive": "google", "gmail": "google"}
+        scheme = detail.rsplit(" ", 1)[-1] if detail.startswith("no plugin for ") else None
+        extra = _SCHEME_TO_EXTRA.get(scheme, scheme) if scheme else None
+        suggestions = (
+            [f"install the connector extra: uv sync --extra {extra}"]
+            if scheme
+            else _CODE_SUGGESTIONS["not_available"]
+        )
+        return JSONResponse(
+            status_code=501,
+            content={"code": "not_available", "detail": detail, "suggestions": suggestions},
+        )
+    @app.exception_handler(Exception)
+    async def _unhandled_exc(_request: Request, exc: Exception) -> JSONResponse:
+        """Any uncaught error still returns the stable envelope so SDKs can switch on
+        `code` instead of parsing a raw 500 body."""
+        return JSONResponse(
+            status_code=500,
+            content={"code": "internal_error", "detail": str(exc), "suggestions": []},
+        )
+    def eng() -> Engine:
+        """Return the Engine that `lifespan` stored on `app.state` at startup."""
+        return app.state.engine
+    @app.get(
+        "/v1/server/info", response_model=ServerInfo, operation_id="getServerInfo", tags=["server"]
+    )
+    async def server_info() -> ServerInfo:
+        import socket
+        return ServerInfo(version="0.4.0", machine_id=socket.gethostname(), namespace=cfg.namespace)
+    @app.post("/v1/add", response_model=AddResponse, operation_id="addSource", tags=["ingest"])
+    async def add(body: AddRequest) -> AddResponse:
+        try:
+            job_id = await eng().add(
+                body.target,
+                config=body.config,
+                full=body.full,
+                since=body.since,
+                process=body.process,
+                update_config=body.update,
+            )
+        except ValueError as e:
+            code = str(e)
+            status = 409 if code in ("sync_already_running", "connector_removing") else 400
+            raise HTTPException(status, code)  # -> error envelope
+        return AddResponse(job_id=job_id)
+    @app.post(
+        "/v1/jobs/{job_id}/cancel",
+        response_model=CancelResponse,
+        operation_id="cancelJob",
+        tags=["ingest"],
+    )
+    async def cancel_job(job_id: str) -> CancelResponse:
+        ok = await eng().cancel_job(job_id)
+        return CancelResponse(job_id=job_id, cancelled=ok)
+    @app.post(
+        "/v1/connectors/probe",
+        response_model=ProbeResponse,
+        operation_id="probeConnector",
+        tags=["connectors"],
+    )
+    async def probe(body: ProbeRequest) -> ProbeResponse:
+        return ProbeResponse(**await eng().probe(body.target, body.config))
+    @app.post(
+        "/v1/connectors/estimate",
+        response_model=EstimateResponse,
+        operation_id="estimateConnector",
+        tags=["connectors"],
+    )
+    async def estimate(body: ProbeRequest) -> EstimateResponse:
+        """Zero-billing pre-flight estimate: object/chunk/token counts via
+        metadata + a local chunker/tokenizer dry-run. No embedding API calls."""
+        try:
+            return EstimateResponse(
+                **await eng().estimate(body.target, body.config, since=body.since)
+            )
+        except ValueError as e:
+            # e.g. an unreachable / missing source root surfaces as connector_unhealthy;
+            # return the clean envelope instead of a raw 500.
+            raise HTTPException(400, str(e))
+    @app.get("/v1/connectors/inspect", operation_id="inspectConnector", tags=["connectors"])
+    async def inspect(target: str):
+        out = await eng().inspect(target)
+        if out is None:
+            raise HTTPException(404, "connector not found")
+        return out
+    @app.delete(
+        "/v1/connectors",
+        response_model=RemoveResponse,
+        operation_id="removeConnector",
+        tags=["connectors"],
+    )
+    async def remove(target: str) -> RemoveResponse:
+        try:
+            return RemoveResponse(target=target, removed=await eng().remove_connector(target))
+        except ValueError as e:
+            raise HTTPException(400, str(e))
+    @app.post(
+        "/v1/upload", response_model=AddResponse, operation_id="uploadSource", tags=["ingest"]
+    )
+    async def upload(request: Request, name: str, process: bool = True) -> AddResponse:
+        """CS upload flow: POST a tar(.gz) of a tree as the raw body (?name=<label>);
+        the server stages + indexes it. For client/server without a shared filesystem."""
+        try:
+            data = await request.body()
+        except ClientDisconnect:
+            raise HTTPException(499, "client disconnected during upload")
+        if not data:
+            raise HTTPException(400, "empty upload body")
+        try:
+            out = await eng().ingest_upload(name, data, process=process)
+        except ValueError as e:
+            raise HTTPException(400, str(e))
+        return AddResponse(job_id=out["job_id"])
+    @app.post(
+        "/v1/files/manifest",
+        response_model=ManifestResponse,
+        operation_id="filesManifest",
+        tags=["ingest"],
+    )
+    async def files_manifest(body: ManifestRequest) -> ManifestResponse:
+        """Manifest-diff upload step ②: stat-only manifest in, need_sha1 + deletion
+        candidates out. No bytes transferred here."""
+        out = await eng().files_manifest(
+            body.client_id, body.root, [f.model_dump() for f in body.files]
+        )
+        return ManifestResponse(**out)
+    @app.put(
+        "/v1/files/upload", response_model=AddResponse, operation_id="filesUpload", tags=["ingest"]
+    )
+    async def files_upload(
+        request: Request, client_id: str, root: str, process: bool = True, full: bool = False
+    ) -> AddResponse:
+        """Manifest-diff upload step ④: PUT a tar(.gz) carrying a `.mfs-meta.json`
+        member (hashes/renames/deletions) + the changed file bytes. The server applies
+        it to the staging area and triggers the file-connector sync. full=true
+        (--force-index/--force-upload) forces a re-index of the whole staged tree."""
+        try:
+            data = await request.body()
+        except ClientDisconnect:
+            raise HTTPException(499, "client disconnected during upload")
+        if not data:
+            raise HTTPException(400, "empty upload body")
+        try:
+            out = await eng().files_upload(client_id, root, data, process=process, full=full)
+        except ValueError as e:
+            raise HTTPException(400, str(e))
+        return AddResponse(job_id=out["job_id"])
+    @app.get("/v1/search", response_model=SearchResponse, operation_id="search", tags=["retrieval"])
+    async def search(
+        request: Request,
+        q: str,
+        path: str | None = None,
+        mode: Literal["hybrid", "semantic", "keyword"] = "hybrid",
+        top_k: int = 10,
+        collapse: bool = False,
+        kind: str | None = None,
+    ) -> SearchResponse:
+        _reject_unknown_query_params(request, {"q", "path", "mode", "top_k", "collapse", "kind"})
+        connector_uri = None
+        object_prefix = None
+        if path:
+            connector_uri, object_prefix = await eng().resolve_connector_uri(path)
+        # comma-separated chunk_kinds, e.g. ?kind=body,directory_summary
+        chunk_kinds = [k.strip() for k in kind.split(",") if k.strip()] if kind else None
+        try:
+            results = await eng().search(
+                q,
+                connector_uri=connector_uri,
+                object_prefix=object_prefix,
+                mode=mode,
+                top_k=top_k,
+                chunk_kinds=chunk_kinds,
+                collapse=collapse,
+            )
+        except ValueError as e:
+            raise HTTPException(400, str(e))
+        return SearchResponse(results=results)
+    @app.get("/v1/grep", response_model=GrepResponse, operation_id="grep", tags=["retrieval"])
+    async def grep(pattern: str, path: str) -> GrepResponse:
+        # A scope path that resolves under no connector raises ValueError ("path not under
+        # any registered connector") from _open_path — map it to a clean 404 like ls/cat
+        # instead of letting it escape as a raw 500 (search returns [] for the same case;
+        # grep follows the browse family's explicit not_found here).
+        try:
+            return GrepResponse(results=await eng().grep(pattern, path))
+        except (FileNotFoundError, NotADirectoryError, ValueError) as e:
+            raise HTTPException(404, str(e))
+    @app.get("/v1/ls", response_model=LsResponse, operation_id="ls", tags=["browse"])
+    async def ls(path: str) -> LsResponse:
+        try:
+            return LsResponse(**await eng().ls(path))
+        except (FileNotFoundError, NotADirectoryError, ValueError) as e:
+            raise HTTPException(404, str(e))
+    @app.get(
+        "/v1/cat",
+        operation_id="cat",
+        tags=["browse"],
+        response_model=None,
+        responses={200: {"model": CatResponse}},
+    )
+    async def cat(
+        path: str,
+        range: str | None = None,
+        meta: bool = False,
+        density: str | None = None,
+        locator: str | None = None,
+    ):
+        # Read one object. `range` and `locator` arrive as strings and are parsed here
+        # before being handed to the engine; engine errors are mapped to 400/404 below.
+        import json as _json
+        rg = None
+        if range:
+            # External --range is 1-based half-open [start, end) — matches
+            # locator.lines, head/tail line counts, and how humans cite ranges
+            # ("lines 100 to 200"). Require an explicit colon so a bare "100"
+            # doesn't silently degrade to a single line or an open end. Convert
+            # to 0-based half-open here; engine.cat + plugin.read stay 0-based
+            # internally.
+            if ":" not in range:
+                raise HTTPException(
+                    400, "invalid range: expected start:end (1-based, end-exclusive)"
+                )
+            a, _, b = range.partition(":")
+            try:
+                # An empty side is open-ended: start defaults to 1, end to 2**63 - 1.
+                start_1 = int(a) if a.strip() else 1
+                end_1 = int(b) if b.strip() else (2**63 - 1)
+            except ValueError:
+                raise HTTPException(400, "invalid range")
+            if start_1 < 1:
+                raise HTTPException(400, "invalid range: start must be >= 1")
+            if end_1 < start_1:
+                raise HTTPException(400, "invalid range: end must be >= start")
+            # Shift both bounds down by one: 1-based [start, end) -> 0-based [start, end).
+            rg = (start_1 - 1, end_1 - 1)
+        loc = None
+        if locator:
+            # The locator query parameter is a JSON document.
+            try:
+                loc = _json.loads(locator)
+            except ValueError:
+                raise HTTPException(400, "invalid locator JSON")
+        try:
+            out = await eng().cat(path, range=rg, meta=meta, density=density, locator=loc)
+        except IsADirectoryError:
+            raise HTTPException(400, "is_directory")
+        except ValueError as e:
+            # The ValueError text is treated as the error code: these three are client
+            # errors (400); every other code, locator_not_found included, is a 404.
+            code = str(e)
+            if code in ("density_unsupported", "range_unsupported", "object_too_large_for_cat"):
+                raise HTTPException(400, code)
+            if code == "locator_not_found":
+                raise HTTPException(404, "locator_not_found")
+            raise HTTPException(404, code)
+        except FileNotFoundError as e:
+            raise HTTPException(404, str(e))
+        # With meta=true a dict result is wrapped in CatMeta; anything else is returned as-is.
+        if meta:
+            return CatMeta(**out) if isinstance(out, dict) else out
+        if isinstance(out, dict):  # locator hit -> {source, locator, content}
+            return CatResponse(source=out.get("source", path), content=out.get("content", ""))
+        return CatResponse(source=path, content=out)
+    async def _read_op(fn, path: str):
+        """Shared error mapping for head/tail/export."""
+        try:
+            return await fn(path)
+        except IsADirectoryError:
+            raise HTTPException(400, "is_directory")
+        except FileNotFoundError as e:
+            raise HTTPException(404, str(e))
+        except ValueError as e:
+            raise HTTPException(400, str(e))
+    @app.get("/v1/head", response_model=CatResponse, operation_id="head", tags=["browse"])
+    async def head(path: str, n: int = 20) -> CatResponse:
+        return CatResponse(source=path, content=await _read_op(lambda p: eng().head(p, n), path))
+    @app.get("/v1/tail", response_model=CatResponse, operation_id="tail", tags=["browse"])
+    async def tail(path: str, n: int = 20) -> CatResponse:
+        return CatResponse(source=path, content=await _read_op(lambda p: eng().tail(p, n), path))
+    @app.get("/v1/export", response_model=CatResponse, operation_id="export", tags=["browse"])
+    async def export(path: str) -> CatResponse:
+        """Full object content for `mfs export`. Honest about completeness:
+        each connector's own row cap still applies (postgres `max_read_rows`,
+        BigQuery `max_read_rows`, etc.), so structured objects above that
+        threshold return `partial=true`. The bare-cat size guard
+        (object_too_large_for_cat) does NOT apply — export is the escape
+        hatch for that — but true streaming export is still TODO."""
+        text, partial = await _read_op(eng().export, path)
+        return CatResponse(source=path, content=text, partial=partial)
+    @app.get("/healthz", tags=["server"])
+    async def healthz() -> dict:
+        """Unauthenticated liveness/readiness probe (no sensitive data); used by the
+        compose healthcheck and Helm probes so they work even with auth enabled."""
+        return {"status": "ok"}
+    @app.get("/v1/status", response_model=StatusResponse, operation_id="status", tags=["server"])
+    async def status() -> StatusResponse:
+        # Per-connector object/chunk counts come from the metadata `objects` table
+        # (objects.chunk_count is already maintained per object). One grouped LEFT JOIN —
+        # connectors with nothing indexed yet still report 0/0 — so status surfaces store
+        # state without a full Milvus scan.
+        conns = await eng().meta.fetchall(
+            "SELECT c.root_uri AS root_uri, c.type AS type, c.status AS status, "
+            "  COUNT(o.object_uri) AS object_count, "
+            "  COALESCE(SUM(o.chunk_count), 0) AS chunk_count "
+            "FROM connectors c LEFT JOIN objects o ON o.connector_id = c.id "
+            "WHERE c.namespace_id=? GROUP BY c.id, c.root_uri, c.type, c.status",
+            (cfg.namespace,),
+        )
+        jobs = await eng().meta.fetchall(
+            "SELECT status, count(*) AS n FROM connector_jobs GROUP BY status"
+        )
+        return StatusResponse(
+            connectors=[dict(c) for c in conns], jobs={j["status"]: j["n"] for j in jobs}
+        )
+    @app.get("/v1/jobs", response_model=list[JobResponse], operation_id="listJobs", tags=["ingest"])
+    async def list_jobs(limit: int = 20) -> list[JobResponse]:
+        rows = await eng().meta.fetchall(
+            "SELECT * FROM connector_jobs ORDER BY started_at DESC LIMIT ?", (limit,)
+        )
+        return [JobResponse(**{k: dict(r).get(k) for k in JobResponse.model_fields}) for r in rows]
+    @app.get(
+        "/v1/jobs/{job_id}", response_model=JobResponse, operation_id="getJob", tags=["ingest"]
+    )
+    async def job(job_id: str) -> JobResponse:
+        row = await eng().meta.fetchone("SELECT * FROM connector_jobs WHERE id=?", (job_id,))
+        if not row:
+            raise HTTPException(404, "job not found")
+        return JobResponse(**{k: dict(row).get(k) for k in JobResponse.model_fields})
+    return app