npm - @hypabolic/crossbar - Versions diffs - 0.1.0 - Mend

@hypabolic/crossbar 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

package/ARCHITECTURE.md +168 -0
package/CAPABILITY-MATRIX.md +49 -0
package/LICENSE +21 -0
package/README.md +127 -0
package/RESEARCH.md +343 -0
package/package.json +53 -0
package/src/adapters/anthropic.ts +197 -0
package/src/adapters/generic.ts +164 -0
package/src/adapters/index.ts +64 -0
package/src/adapters/llamacpp.ts +217 -0
package/src/adapters/llamaswap.ts +276 -0
package/src/adapters/lmstudio.ts +307 -0
package/src/adapters/ollama.ts +340 -0
package/src/adapters/openai.ts +195 -0
package/src/adapters/vllm.ts +197 -0
package/src/core/backend-adapter.ts +123 -0
package/src/core/capability.ts +53 -0
package/src/core/index.ts +36 -0
package/src/core/types.ts +160 -0
package/src/discovery/engine.ts +247 -0
package/src/discovery/probe.ts +144 -0
package/src/index.ts +158 -0
package/src/registry/ids.ts +68 -0
package/src/registry/persistence.ts +111 -0
package/src/registry/pi-credential-store.ts +27 -0
package/src/registry/registry.ts +150 -0
package/src/shim/provider-shim.ts +187 -0
package/src/ui/loaded-widget.ts +220 -0
package/src/ui/onboarding.ts +439 -0

package/src/adapters/llamaswap.ts ADDED Viewed

@@ -0,0 +1,276 @@
+/**
+ * llama-swap BackendAdapter
+ *
+ * llama-swap (mostlygeek/llama-swap) is a proxy front-door for llama-server instances that enables
+ * hot-swapping models at runtime. It exposes the llama-swap-specific /running and /upstream/{model}
+ * paths that distinguish it from a bare llama-server.
+ *
+ * Fingerprint: GET /running 200 (JSON) — a path that only llama-swap exposes.
+ * Inference base URL: server.baseUrl + "/v1"  (OpenAI + Anthropic compat front door).
+ */
+import { Capability } from "../core/capability.ts";
+import type { BackendAdapter, PiApiType } from "../core/backend-adapter.ts";
+import type {
+  DiscoveredServer,
+  HealthStatus,
+  LoadAction,
+  LoadedState,
+  ModelDescriptor,
+  PiModelEntry,
+  Probe,
+  ServerCredential,
+} from "../core/types.ts";
+// ---------------------------------------------------------------------------
+// Internal types
+// ---------------------------------------------------------------------------
+/**
+ * Loose shape of an object found in a llama-swap /running payload.
+ * Every named field is optional; the index signature admits any other keys.
+ */
+interface RunningBody {
+  /** Model id; preferred over `model` when both are present on an array item. */
+  id?: string;
+  /** Alternative id field, used when `id` is absent. */
+  model?: string;
+  /** List of running model ids carried on an envelope object. */
+  models?: string[];
+  // llama-swap /running can return a single object or an array of running upstreams
+  [key: string]: unknown;
+}
+/** Subset of the /v1/models response body that this adapter reads: only each entry's `id`. */
+interface V1ModelsBody {
+  /** Model entries; the field is optional and treated as empty when absent. */
+  data?: Array<{
+    id: string;
+  }>;
+}
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Extract running model ids from a /running response.
+ *
+ * Accepted payload shapes:
+ *   - `{ running: [...] }`  envelope holding a list of running upstreams
+ *   - `[...]`               bare list of running upstreams
+ *   - `{ models: [...] }`   list of ids on an envelope object
+ *   - `{ id: "..." }` or `{ model: "..." }`  single running upstream
+ * List items may be plain id strings or objects carrying `id` / `model`.
+ *
+ * Because callers pass `r.json ?? r.text`, the payload may also arrive as raw
+ * JSON text; it is parsed first, and text that is not valid JSON yields `[]`.
+ *
+ * @param json Parsed JSON value or raw response text.
+ * @returns Running model ids in payload order; `[]` for unrecognised input.
+ */
+function parseRunningIds(json: unknown): string[] {
+  let payload: unknown = json;
+  if (typeof payload === "string") {
+    try {
+      payload = JSON.parse(payload);
+    } catch {
+      return [];
+    }
+  }
+  if (!payload || typeof payload !== "object") return [];
+  // One list item -> zero or one id. `id` wins over `model` when both exist.
+  const idsFromList = (items: unknown[]): string[] =>
+    items.flatMap((item) => {
+      if (typeof item === "string") return [item];
+      if (item && typeof item === "object") {
+        const entry = item as RunningBody;
+        const id = entry.id ?? entry.model;
+        return typeof id === "string" ? [id] : [];
+      }
+      return [];
+    });
+  // Bare array of running-upstream objects
+  if (Array.isArray(payload)) return idsFromList(payload);
+  const body = payload as RunningBody;
+  // { running: [...] }
+  const running = body["running"];
+  if (Array.isArray(running)) return idsFromList(running);
+  // { models: [...] }
+  if (Array.isArray(body.models)) return idsFromList(body.models);
+  // { id: "..." }
+  if (typeof body.id === "string") return [body.id];
+  // { model: "..." }
+  if (typeof body.model === "string") return [body.model];
+  return [];
+}
+// ---------------------------------------------------------------------------
+// LlamaswapAdapter
+// ---------------------------------------------------------------------------
+/**
+ * BackendAdapter implementation for llama-swap.
+ *
+ * Management calls use the paths probed below (/running, /upstream/{model},
+ * /health, /v1/models, /api/models/unload); inference is served from
+ * `<baseUrl>/v1`.
+ */
+class LlamaswapAdapter implements BackendAdapter {
+  readonly kind = "llamaswap" as const;
+  readonly displayName = "llama-swap";
+  readonly defaultPorts: readonly number[] = [8080];
+  readonly piApi: PiApiType = "openai-completions";
+  readonly capabilities: ReadonlySet<Capability> = new Set<Capability>([
+    Capability.ListModels,
+    Capability.IntrospectLoaded,
+    Capability.SwitchModel,
+    Capability.LoadUnload,
+    Capability.Health,
+    Capability.Streaming,
+  ]);
+  /**
+   * Build the /upstream/{model} path for a model id.
+   *
+   * Each "/"-separated segment is percent-encoded on its own, so ids that
+   * contain "?", "#", "%" or spaces cannot alter the request URL, while "/"
+   * inside an id is kept as a path separator.
+   */
+  private static upstreamPath(modelId: string): string {
+    const encoded = modelId
+      .split("/")
+      .map((segment) => encodeURIComponent(segment))
+      .join("/");
+    return `/upstream/${encoded}`;
+  }
+  // --- fingerprint ----------------------------------------------------------
+  /**
+   * Detect a llama-swap server by probing /running.
+   *
+   * @returns A DiscoveredServer (confidence 0.9, auth "none") when the probe
+   *   succeeds and any unparsed body text is valid JSON; otherwise null.
+   */
+  async fingerprint(baseUrl: string, probe: Probe): Promise<DiscoveredServer | null> {
+    // /running is a llama-swap-only path — not present on bare llama-server.
+    const r = await probe("/running");
+    if (!r.ok) return null;
+    // Must parse as JSON (llama-swap returns JSON from /running, not plain text)
+    if (r.json === undefined && r.text !== undefined) {
+      // If text is not JSON, bail
+      try {
+        JSON.parse(r.text);
+      } catch {
+        return null;
+      }
+    }
+    return {
+      kind: "llamaswap",
+      baseUrl,
+      auth: "none",
+      label: `llama-swap (${baseUrl})`,
+      confidence: 0.9,
+    };
+  }
+  // --- health ---------------------------------------------------------------
+  /**
+   * Probe /health and map the result to a HealthStatus.
+   *
+   * status 0 -> "unreachable", 401 -> "unauthorized", any other non-ok
+   * response -> "degraded". An ok response is "degraded" only when it has a
+   * non-empty text body that is neither "OK" nor backed by JSON
+   * `{ status: "ok" }`; otherwise it is "healthy", with latencyMs copied over
+   * when the probe reports it.
+   */
+  async health(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<HealthStatus> {
+    const r = await probe("/health");
+    if (r.status === 0) return { state: "unreachable" };
+    if (r.status === 401) return { state: "unauthorized" };
+    if (!r.ok) return { state: "degraded" };
+    // llama-swap /health returns plain "OK" text
+    const isOk =
+      r.text?.trim().toUpperCase() === "OK" ||
+      (r.json && typeof r.json === "object" && (r.json as { status?: string }).status === "ok");
+    if (!isOk && r.text !== undefined && r.text.trim() !== "") {
+      return { state: "degraded" };
+    }
+    const status: HealthStatus = { state: "healthy" };
+    if (r.latencyMs !== undefined) status.latencyMs = r.latencyMs;
+    return status;
+  }
+  // --- listModels -----------------------------------------------------------
+  /**
+   * List models from /v1/models.
+   *
+   * Only each entry's `id` is read; context window (8192), max tokens (4096),
+   * text-only input and `reasoning: false` are fixed defaults. A body without
+   * a `data` array yields `[]`, and entries lacking a string `id` are skipped
+   * rather than surfacing as descriptors with an undefined id.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async listModels(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<ModelDescriptor[]> {
+    const r = await probe("/v1/models");
+    if (!r.ok) {
+      if (r.status === 401) throw new Error("401 Unauthorized");
+      if (r.status === 0) throw new Error("listModels failed: server unreachable");
+      throw new Error(`listModels failed: status ${r.status}`);
+    }
+    const data = (r.json as V1ModelsBody | null | undefined)?.data;
+    if (!Array.isArray(data)) return [];
+    return data
+      .filter((entry) => entry != null && typeof entry.id === "string")
+      .map((entry) => ({
+        id: entry.id,
+        name: entry.id,
+        contextWindow: 8192,
+        maxTokens: 4096,
+        input: ["text"] as ("text" | "image")[],
+        reasoning: false,
+      }));
+  }
+  // --- introspectLoaded -----------------------------------------------------
+  /**
+   * Report which models are currently running, read from /running.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async introspectLoaded(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<LoadedState> {
+    const r = await probe("/running");
+    if (!r.ok) {
+      if (r.status === 401) throw new Error("401 Unauthorized");
+      if (r.status === 0) throw new Error("introspectLoaded failed: server unreachable");
+      throw new Error(`introspectLoaded failed: status ${r.status}`);
+    }
+    const ids = parseRunningIds(r.json ?? r.text);
+    return {
+      loadedModelIds: ids,
+      source: "introspection",
+    };
+  }
+  // --- switchModel ----------------------------------------------------------
+  /**
+   * Switch to `modelId`: request its upstream, then confirm it via /running.
+   *
+   * @throws Error when either probe fails, or with a `model-not-loaded: ...`
+   *   message when the id is missing from /running afterwards.
+   */
+  async switchModel(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    modelId: string,
+    probe: Probe,
+  ): Promise<void> {
+    // Step 1: GET /upstream/{model} — triggers llama-swap to start that upstream.
+    const r1 = await probe(LlamaswapAdapter.upstreamPath(modelId));
+    if (!r1.ok) {
+      if (r1.status === 0) throw new Error("server unreachable during switchModel");
+      if (r1.status === 401) throw new Error("401 Unauthorized");
+      throw new Error(`switchModel: upstream request failed: status ${r1.status}`);
+    }
+    // Step 2: Confirm via GET /running that the target is now active.
+    const r2 = await probe("/running");
+    if (!r2.ok) {
+      if (r2.status === 0) throw new Error("server went down after switch request");
+      if (r2.status === 401) throw new Error("401 Unauthorized");
+      throw new Error(`switchModel: confirmation probe failed: status ${r2.status}`);
+    }
+    const runningIds = parseRunningIds(r2.json ?? r2.text);
+    if (!runningIds.includes(modelId)) {
+      throw new Error(`model-not-loaded: ${modelId} not found in /running after switch`);
+    }
+  }
+  // --- loadUnload -----------------------------------------------------------
+  /**
+   * Load a model (GET /upstream/{model}) or unload it
+   * (POST /api/models/unload with a JSON `{ model }` body).
+   *
+   * NOTE(review): confirm against the llama-swap API that the unload endpoint
+   * honours the `{ model }` body rather than unloading every model.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async loadUnload(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    modelId: string,
+    action: LoadAction,
+    probe: Probe,
+  ): Promise<void> {
+    if (action === "load") {
+      // load: GET /upstream/{model}
+      const r = await probe(LlamaswapAdapter.upstreamPath(modelId));
+      if (!r.ok) {
+        if (r.status === 0) throw new Error("server unreachable during load");
+        if (r.status === 401) throw new Error("401 Unauthorized");
+        throw new Error(`loadUnload(load) failed: status ${r.status}`);
+      }
+    } else {
+      // unload: POST /api/models/unload
+      const r = await probe(`/api/models/unload`, {
+        method: "POST",
+        body: JSON.stringify({ model: modelId }),
+        headers: { "content-type": "application/json" },
+      });
+      if (!r.ok) {
+        if (r.status === 0) throw new Error("server unreachable during unload");
+        if (r.status === 401) throw new Error("401 Unauthorized");
+        throw new Error(`loadUnload(unload) failed: status ${r.status}`);
+      }
+    }
+  }
+  // --- toPiModel ------------------------------------------------------------
+  /**
+   * Convert a ModelDescriptor into a PiModelEntry.
+   * Costs are all zero; missing fields fall back to reasoning=false,
+   * input=["text"], contextWindow=8192 and maxTokens=4096.
+   */
+  toPiModel(_server: DiscoveredServer, model: ModelDescriptor): PiModelEntry {
+    return {
+      id: model.id,
+      name: model.name,
+      reasoning: model.reasoning ?? false,
+      input: model.input.length > 0 ? model.input : ["text"],
+      cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+      contextWindow: model.contextWindow ?? 8192,
+      maxTokens: model.maxTokens ?? 4096,
+    };
+  }
+  // --- inferenceBaseUrl -----------------------------------------------------
+  /**
+   * Base URL for inference requests: the server base URL plus "/v1".
+   * Trailing slashes on `baseUrl` are dropped first so the result never
+   * contains "//v1".
+   */
+  inferenceBaseUrl(server: DiscoveredServer): string {
+    return `${server.baseUrl.replace(/\/+$/, "")}/v1`;
+  }
+}
+// ---------------------------------------------------------------------------
+// Singleton export
+// ---------------------------------------------------------------------------
+/** Module-level LlamaswapAdapter instance, exported under the BackendAdapter interface type. */
+export const llamaswapAdapter: BackendAdapter = new LlamaswapAdapter();

package/src/adapters/lmstudio.ts ADDED Viewed

@@ -0,0 +1,307 @@
+/**
+ * LM Studio backend adapter.
+ *
+ * Implements the BackendAdapter contract for LM Studio's local server.
+ * Uses the LM Studio-native /api/v0/* endpoints for discovery and management,
+ * and delegates inference to the OpenAI-compatible /v1/* layer.
+ *
+ * Key API endpoints:
+ *   GET  /api/v0/models            — model list with state, type, context lengths
+ *   POST /api/v1/models/load       — load a model by id
+ *   POST /api/v1/models/unload     — unload a model by id
+ *
+ * Fingerprint discriminator: at least one data[] entry carries a `state` field.
+ * LM Studio's v0 API also sends `compatibility_type`, but `state` alone is accepted.
+ */
+import { Capability } from "../core/capability.ts";
+import type { BackendAdapter, PiApiType } from "../core/backend-adapter.ts";
+import type {
+  DiscoveredServer,
+  HealthStatus,
+  LoadAction,
+  LoadedState,
+  ModelDescriptor,
+  PiModelEntry,
+  Probe,
+  ServerCredential,
+} from "../core/types.ts";
+// ---------------------------------------------------------------------------
+// LM Studio API shapes (narrowed from unknown JSON)
+// ---------------------------------------------------------------------------
+/**
+ * One model entry from GET /api/v0/models, reduced to the fields this adapter
+ * reads. Only `id` is required; the rest are copied over when present with the
+ * expected primitive type.
+ */
+interface LmsModelEntry {
+  id: string;
+  type?: string;                    // "llm" | "vlm" | "embeddings"
+  state?: string;                   // "loaded" | "not-loaded"
+  max_context_length?: number;
+  loaded_context_length?: number;
+  quantization?: string;
+  arch?: string;
+}
+/** Narrowed /api/v0/models response; `data` is absent when the body had no usable `data` array. */
+interface LmsModelsResponse {
+  data?: LmsModelEntry[];
+}
+// ---------------------------------------------------------------------------
+// Helpers
+// ---------------------------------------------------------------------------
+/**
+ * Narrow an unknown JSON body to a LmsModelsResponse defensively.
+ *
+ * Returns `{}` when the body is not an object or has no `data` array.
+ * Non-object items are skipped, and so are items without a usable id: a
+ * missing, empty or non-primitive `id` would otherwise become the bogus ids
+ * "" or "[object Object]" and leak into model lists and loaded-model ids.
+ * String ids are kept as-is and finite numeric ids are stringified. Optional
+ * fields are copied only when they have the expected primitive type.
+ *
+ * @param json Parsed response body of unknown shape.
+ * @returns The narrowed response with entries in their original order.
+ */
+function parseModelsBody(json: unknown): LmsModelsResponse {
+  if (json == null || typeof json !== "object") return {};
+  const obj = json as Record<string, unknown>;
+  const data = obj["data"];
+  if (!Array.isArray(data)) return {};
+  const entries: LmsModelEntry[] = [];
+  for (const item of data) {
+    if (item == null || typeof item !== "object") continue;
+    const m = item as Record<string, unknown>;
+    const rawId = m["id"];
+    let id: string;
+    if (typeof rawId === "string") {
+      id = rawId;
+    } else if (typeof rawId === "number" && Number.isFinite(rawId)) {
+      id = String(rawId);
+    } else {
+      continue;
+    }
+    if (id === "") continue;
+    const entry: LmsModelEntry = { id };
+    if (typeof m["type"] === "string") entry.type = m["type"];
+    if (typeof m["state"] === "string") entry.state = m["state"];
+    if (typeof m["max_context_length"] === "number") entry.max_context_length = m["max_context_length"];
+    if (typeof m["loaded_context_length"] === "number") entry.loaded_context_length = m["loaded_context_length"];
+    if (typeof m["quantization"] === "string") entry.quantization = m["quantization"];
+    if (typeof m["arch"] === "string") entry.arch = m["arch"];
+    entries.push(entry);
+  }
+  return { data: entries };
+}
+/**
+ * Decide whether a raw /api/v0/models body looks like it came from LM Studio.
+ *
+ * The check runs on the raw JSON (before narrowing) and passes as soon as one
+ * object entry in `data` has a `state` key. Entries that also carry
+ * `compatibility_type` pass through the same test, so that field is never
+ * required on its own.
+ *
+ * @param json Parsed response body of unknown shape.
+ * @returns true when `data` is an array holding at least one object entry
+ *   with a `state` key; false for anything else, including an empty array.
+ */
+function hasLmsDiscriminator(json: unknown): boolean {
+  if (typeof json !== "object" || json === null) return false;
+  const entries = (json as Record<string, unknown>)["data"];
+  if (!Array.isArray(entries)) return false;
+  return entries.some(
+    (entry) => typeof entry === "object" && entry !== null && "state" in entry,
+  );
+}
+/**
+ * Build a Crossbar ModelDescriptor from one LM Studio model entry.
+ *
+ * The entry id doubles as the display name. `type` decides the modalities
+ * ("vlm" adds "image" to the default "text") and the embeddings flag;
+ * `state === "loaded"` sets `loaded`. The source entry is kept under `raw`,
+ * and `contextWindow` is only set when `max_context_length` is present.
+ */
+function toDescriptor(m: LmsModelEntry): ModelDescriptor {
+  const descriptor: ModelDescriptor = {
+    id: m.id,
+    name: m.id,
+    input: m.type === "vlm" ? ["text", "image"] : ["text"],
+    embeddings: m.type === "embeddings",
+    loaded: m.state === "loaded",
+    raw: m,
+  };
+  if (m.max_context_length === undefined) return descriptor;
+  descriptor.contextWindow = m.max_context_length;
+  return descriptor;
+}
+// ---------------------------------------------------------------------------
+// LmStudioAdapter
+// ---------------------------------------------------------------------------
+/**
+ * BackendAdapter implementation for LM Studio's local server.
+ *
+ * Discovery, health and model state all read GET /api/v0/models; loading and
+ * unloading POST to /api/v1/models/load and /api/v1/models/unload; inference
+ * is served from `<baseUrl>/v1`.
+ */
+class LmStudioAdapter implements BackendAdapter {
+  readonly kind = "lmstudio" as const;
+  readonly displayName = "LM Studio";
+  readonly defaultPorts: readonly number[] = [1234];
+  readonly piApi: PiApiType = "openai-completions";
+  readonly capabilities: ReadonlySet<Capability> = new Set<Capability>([
+    Capability.ListModels,
+    Capability.IntrospectLoaded,
+    Capability.SwitchModel,
+    Capability.LoadUnload,
+    Capability.Health,
+    Capability.PerModelCaps,
+    Capability.Streaming,
+  ]);
+  // --- fingerprint ----------------------------------------------------------
+  /**
+   * Detect LM Studio by probing /api/v0/models.
+   *
+   * @returns A DiscoveredServer (confidence 0.95, auth "none", label with the
+   *   URL scheme stripped) when the probe succeeds and the body passes
+   *   hasLmsDiscriminator; otherwise null.
+   */
+  async fingerprint(baseUrl: string, probe: Probe): Promise<DiscoveredServer | null> {
+    const r = await probe("/api/v0/models");
+    if (!r.ok || r.status === 0) return null;
+    if (!hasLmsDiscriminator(r.json)) return null;
+    return {
+      kind: "lmstudio",
+      baseUrl,
+      auth: "none",
+      label: `LM Studio (${baseUrl.replace(/^https?:\/\//, "")})`,
+      confidence: 0.95,
+    };
+  }
+  // --- health ---------------------------------------------------------------
+  /**
+   * Probe /api/v0/models and map the result to a HealthStatus:
+   * status 0 -> "unreachable", 401 -> "unauthorized", any other non-ok
+   * response -> "degraded", otherwise "healthy" (with latencyMs when reported).
+   */
+  async health(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<HealthStatus> {
+    const r = await probe("/api/v0/models");
+    if (r.status === 0) return { state: "unreachable" };
+    if (r.status === 401) return { state: "unauthorized" };
+    if (!r.ok) return { state: "degraded" };
+    const status: HealthStatus = { state: "healthy" };
+    if (r.latencyMs !== undefined) status.latencyMs = r.latencyMs;
+    return status;
+  }
+  // --- listModels -----------------------------------------------------------
+  /**
+   * List every model reported by /api/v0/models as a ModelDescriptor.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async listModels(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<ModelDescriptor[]> {
+    const r = await probe("/api/v0/models");
+    if (!r.ok) {
+      if (r.status === 401) throw new Error("401 Unauthorized");
+      if (r.status === 0) throw new Error("listModels failed: server unreachable");
+      throw new Error(`listModels failed: status ${r.status}`);
+    }
+    const body = parseModelsBody(r.json);
+    if (!body.data) return [];
+    return body.data.map(toDescriptor);
+  }
+  // --- introspectLoaded -----------------------------------------------------
+  /**
+   * Report the models whose `state` is "loaded".
+   *
+   * `perModel` is included only when at least one loaded model reports a
+   * `loaded_context_length`.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async introspectLoaded(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    probe: Probe,
+  ): Promise<LoadedState> {
+    const r = await probe("/api/v0/models");
+    if (!r.ok) {
+      if (r.status === 401) throw new Error("401 Unauthorized");
+      if (r.status === 0) throw new Error("introspectLoaded failed: server unreachable");
+      throw new Error(`introspectLoaded failed: status ${r.status}`);
+    }
+    const body = parseModelsBody(r.json);
+    const loaded = (body.data ?? []).filter((m) => m.state === "loaded");
+    const perModel: Record<string, { contextLength: number }> = {};
+    for (const m of loaded) {
+      if (m.loaded_context_length !== undefined) {
+        perModel[m.id] = { contextLength: m.loaded_context_length };
+      }
+    }
+    const result: LoadedState = {
+      loadedModelIds: loaded.map((m) => m.id),
+      source: "introspection",
+    };
+    if (Object.keys(perModel).length > 0) {
+      result.perModel = perModel;
+    }
+    return result;
+  }
+  // --- switchModel ----------------------------------------------------------
+  /**
+   * Load `modelId`, then confirm through the model list that it is loaded.
+   *
+   * @throws Error when either probe fails, or with a `model-not-loaded: ...`
+   *   message when the model is missing or not in the "loaded" state.
+   */
+  async switchModel(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    modelId: string,
+    probe: Probe,
+  ): Promise<void> {
+    // Step 1: JIT load
+    const r1 = await probe("/api/v1/models/load", {
+      method: "POST",
+      body: JSON.stringify({ model: modelId }),
+      headers: { "content-type": "application/json" },
+    });
+    if (!r1.ok) {
+      if (r1.status === 0) throw new Error("switchModel failed: server unreachable");
+      if (r1.status === 401) throw new Error("401 Unauthorized");
+      throw new Error(`switchModel load failed: status ${r1.status}`);
+    }
+    // Step 2: Confirm via model list that the target is now loaded
+    const r2 = await probe("/api/v0/models");
+    if (!r2.ok) {
+      if (r2.status === 0) throw new Error("switchModel confirmation failed: server went down");
+      if (r2.status === 401) throw new Error("401 Unauthorized");
+      throw new Error(`switchModel confirmation failed: status ${r2.status}`);
+    }
+    const body = parseModelsBody(r2.json);
+    const found = (body.data ?? []).find((m) => m.id === modelId);
+    if (!found || found.state !== "loaded") {
+      throw new Error(`model-not-loaded: ${modelId} not found in loaded state after switch`);
+    }
+  }
+  // --- loadUnload -----------------------------------------------------------
+  /**
+   * Load or unload a model by POSTing a JSON `{ model }` body to
+   * /api/v1/models/load or /api/v1/models/unload.
+   *
+   * NOTE(review): confirm against the LM Studio REST API that the unload
+   * endpoint accepts `{ model }` rather than an instance identifier.
+   *
+   * @throws Error when the probe is not ok (401, unreachable, or other status).
+   */
+  async loadUnload(
+    _server: DiscoveredServer,
+    _cred: ServerCredential,
+    modelId: string,
+    action: LoadAction,
+    probe: Probe,
+  ): Promise<void> {
+    const path = action === "load"
+      ? "/api/v1/models/load"
+      : "/api/v1/models/unload";
+    const r = await probe(path, {
+      method: "POST",
+      body: JSON.stringify({ model: modelId }),
+      headers: { "content-type": "application/json" },
+    });
+    if (!r.ok) {
+      if (r.status === 0) throw new Error(`loadUnload(${action}) failed: server unreachable`);
+      if (r.status === 401) throw new Error("401 Unauthorized");
+      throw new Error(`loadUnload(${action}) failed: status ${r.status}`);
+    }
+  }
+  // --- toPiModel ------------------------------------------------------------
+  /**
+   * Convert a ModelDescriptor into a PiModelEntry.
+   * Costs are all zero; missing fields fall back to reasoning=false,
+   * input=["text"], contextWindow=8192 and maxTokens=4096.
+   */
+  toPiModel(_server: DiscoveredServer, model: ModelDescriptor): PiModelEntry {
+    return {
+      id: model.id,
+      name: model.name,
+      reasoning: model.reasoning ?? false,
+      input: model.input.length > 0 ? (model.input as ("text" | "image")[]) : ["text"],
+      cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+      contextWindow: model.contextWindow ?? 8192,
+      maxTokens: model.maxTokens ?? 4096,
+    };
+  }
+  // --- inferenceBaseUrl -----------------------------------------------------
+  /**
+   * Base URL for inference requests: the server base URL plus "/v1".
+   * Trailing slashes on `baseUrl` are dropped first so the result never
+   * contains "//v1".
+   */
+  inferenceBaseUrl(server: DiscoveredServer): string {
+    return `${server.baseUrl.replace(/\/+$/, "")}/v1`;
+  }
+}
+// ---------------------------------------------------------------------------
+// Singleton export
+// ---------------------------------------------------------------------------
+/** Module-level LmStudioAdapter instance, exported under the BackendAdapter interface type. */
+export const lmstudioAdapter: BackendAdapter = new LmStudioAdapter();