npm - @fusionkit/ensemble - Versions diffs - 0.1.4 → 0.1.6 - Mend

@fusionkit/ensemble 0.1.4 → 0.1.6

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (21)

package/dist/cursorkit-path.d.ts +17 -0
package/dist/cursorkit-path.js +21 -0
package/dist/harness.d.ts +7 -0
package/dist/harness.js +51 -1
package/dist/index.d.ts +5 -8
package/dist/index.js +3 -4
package/dist/run.js +2 -1
package/dist/test/ensemble.test.js +0 -227
package/dist/unified.d.ts +27 -3
package/dist/unified.js +35 -30
package/package.json +8 -7
package/dist/claude-code.d.ts +0 -25
package/dist/claude-code.js +0 -398
package/dist/codex.d.ts +0 -69
package/dist/codex.js +0 -467
package/dist/dashboard.d.ts +0 -62
package/dist/dashboard.js +0 -788
package/dist/test/codex.test.d.ts +0 -1
package/dist/test/codex.test.js +0 -237
package/dist/test/dashboard.test.d.ts +0 -1
package/dist/test/dashboard.test.js +0 -214

package/dist/cursorkit-path.d.ts ADDED Viewed

@@ -0,0 +1,17 @@
+export type CursorkitCli = {
+    /** Absolute path to the bridge entrypoint (`cursorkit serve`). */
+    serveCli: string;
+    /** Absolute path to the bundled test-harness CLI (suite probes). */
+    harnessCli: string;
+};
+/**
+ * Resolve the bundled `@velum-labs/cursorkit` CLIs from node_modules. The
+ * package exports `"."` -> `dist/src/cli.js`; the harness CLI lives next to it
+ * at `dist/src/testing/cli.js` (not exposed via the exports map, so it is
+ * derived from the resolved `"."` entry rather than resolved directly).
+ *
+ * `FUSIONKIT_CURSORKIT_SERVE_CLI` overrides the resolved `serveCli` entry. This
+ * lets a custom build (or an integration test) point the bridge at an alternate
+ * entrypoint; the harness CLI is still derived relative to it.
+ */
+export declare function resolveCursorkitCli(): CursorkitCli;

package/dist/cursorkit-path.js ADDED Viewed

@@ -0,0 +1,21 @@
+import { createRequire } from "node:module";
+import { dirname, join } from "node:path";
+const require = createRequire(import.meta.url);
+/**
+ * Resolve the bundled `@velum-labs/cursorkit` CLIs from node_modules. The
+ * package exports `"."` -> `dist/src/cli.js`; the harness CLI lives next to it
+ * at `dist/src/testing/cli.js` (not exposed via the exports map, so it is
+ * derived from the resolved `"."` entry rather than resolved directly).
+ *
+ * `FUSIONKIT_CURSORKIT_SERVE_CLI` overrides the resolved `serveCli` entry. This
+ * lets a custom build (or an integration test) point the bridge at an alternate
+ * entrypoint; the harness CLI is still derived relative to it.
+ */
+export function resolveCursorkitCli() {
+    const override = process.env.FUSIONKIT_CURSORKIT_SERVE_CLI;
+    const serveCli = override !== undefined && override.length > 0
+        ? override
+        : require.resolve("@velum-labs/cursorkit");
+    const harnessCli = join(dirname(serveCli), "testing", "cli.js");
+    return { serveCli, harnessCli };
+}

package/dist/harness.d.ts CHANGED Viewed

@@ -190,6 +190,13 @@ export type CandidateHardeningMetadata = {
         leak_count: number;
     };
 };
+/**
+ * Serialize hardening metadata as a `JsonValue`. The shape is JSON-compatible by
+ * construction, but TypeScript cannot prove an object type with optional members
+ * satisfies the `JsonValue` index signature, so this typed mapper does the
+ * conversion explicitly (omitting absent optionals) instead of an unchecked cast.
+ */
+export declare function hardeningToJson(hardening: CandidateHardeningMetadata): JsonValue;
 export type EnsembleRuntime = {
     id: string;
     environmentId?: string;

package/dist/harness.js CHANGED Viewed

@@ -1 +1,51 @@
-export {};
+/**
+ * Serialize hardening metadata as a `JsonValue`. The shape is JSON-compatible by
+ * construction, but TypeScript cannot prove an object type with optional members
+ * satisfies the `JsonValue` index signature, so this typed mapper does the
+ * conversion explicitly (omitting absent optionals) instead of an unchecked cast.
+ */
+export function hardeningToJson(hardening) {
+    return {
+        requested_isolation: hardening.requested_isolation,
+        actual_isolation: hardening.actual_isolation,
+        runtime: {
+            ...(hardening.runtime.image !== undefined ? { image: hardening.runtime.image } : {}),
+            ...(hardening.runtime.driver !== undefined ? { driver: hardening.runtime.driver } : {}),
+            ...(hardening.runtime.provider !== undefined ? { provider: hardening.runtime.provider } : {}),
+            ...(hardening.runtime.runtime !== undefined ? { runtime: hardening.runtime.runtime } : {}),
+            ...(hardening.runtime.snapshot_id !== undefined ? { snapshot_id: hardening.runtime.snapshot_id } : {}),
+            ...(hardening.runtime.sandbox_id !== undefined ? { sandbox_id: hardening.runtime.sandbox_id } : {}),
+            ...(hardening.runtime.image_digest !== undefined ? { image_digest: hardening.runtime.image_digest } : {}),
+            ...(hardening.runtime.runtime_digest !== undefined
+                ? { runtime_digest: hardening.runtime.runtime_digest }
+                : {}),
+            workdir: hardening.runtime.workdir
+        },
+        mount_policy: {
+            worktree_writable: hardening.mount_policy.worktree_writable,
+            read_only_caches: [...hardening.mount_policy.read_only_caches],
+            ignored_dirs: [...hardening.mount_policy.ignored_dirs]
+        },
+        network_policy: {
+            default_deny: hardening.network_policy.default_deny,
+            allow_hosts: [...hardening.network_policy.allow_hosts],
+            enforced: hardening.network_policy.enforced
+        },
+        cleanup: {
+            attempted: hardening.cleanup.attempted,
+            succeeded: hardening.cleanup.succeeded,
+            status: hardening.cleanup.status,
+            ...(hardening.cleanup.timed_out !== undefined ? { timed_out: hardening.cleanup.timed_out } : {}),
+            ...(hardening.cleanup.error !== undefined ? { error: hardening.cleanup.error } : {})
+        },
+        secret_absence: {
+            secret_names: [...hardening.secret_absence.secret_names],
+            secret_value_hashes: [...hardening.secret_absence.secret_value_hashes],
+            injected_env_names: [...hardening.secret_absence.injected_env_names],
+            scanned: hardening.secret_absence.scanned,
+            leaks_found: hardening.secret_absence.leaks_found,
+            scan_scope: [...hardening.secret_absence.scan_scope],
+            leak_count: hardening.secret_absence.leak_count
+        }
+    };
+}

package/dist/index.d.ts CHANGED Viewed

@@ -1,18 +1,14 @@
 export { createCommandHarness } from "./command.js";
 export type { CommandHarnessOptions } from "./command.js";
-export { claudeCodeHarness, claudeCodeHarnessCredentialSkipReason, createClaudeCodeHarness } from "./claude-code.js";
-export type { ClaudeCodeHarnessEnv, ClaudeCodeHarnessOptions } from "./claude-code.js";
-export { codexConfigToml, codexHarnessCredentialSkipReason, codexHarness, createCodexHarness } from "./codex.js";
-export type { CodexAmbientProvider, CodexApprovalPolicy, CodexConfigTomlInput, CodexExecInput, CodexExecResult, CodexExecRunner, CodexHarnessEnv, CodexHarnessOptions, CodexOpenAiCompatibleProvider, CodexProvider, CodexResponsesProvider, CodexSandboxMode } from "./codex.js";
+export { resolveCursorkitCli } from "./cursorkit-path.js";
+export type { CursorkitCli } from "./cursorkit-path.js";
 export { createArtifactStore } from "./artifacts.js";
 export type { ArtifactStore } from "./artifacts.js";
-export { createHarnessCapabilityMatrix, harnessDashboard, runHarnessSmokeDashboard } from "./dashboard.js";
-export type { HarnessAdapterReadiness, HarnessAvailability, HarnessCapabilityMatrix, HarnessCapabilityMatrixRow, HarnessCapabilityTarget, HarnessLiveSmokeTarget, HarnessSmokeDashboard, HarnessSmokeDashboardOptions, HarnessSmokeOutcome, HarnessSmokePurpose, HarnessSmokeRecord } from "./dashboard.js";
 export { createMockJudgeSynthesizer } from "./judge.js";
 export type { JudgeCandidateEvidence, JudgeInput, JudgePatch, JudgeRepairInput, JudgeSynthesizer, JudgeSynthesisOutput, JudgeVerificationInput, MockJudgeSynthesizerOptions, SynthesisFailureSummary, SynthesisRepairAttempt, SynthesisVerificationResult } from "./judge.js";
 export { ensemble, runEnsemble } from "./run.js";
-export { createFusionKitJudgeSynthesizer, runFusionPanels, runUnifiedHarnessE2E } from "./unified.js";
-export type { CursorHarnessRunnerInput, CursorHarnessRunnerResult, FusionPanelOptions, UnifiedHarnessE2EOptions, UnifiedHarnessE2EResult, UnifiedHarnessKind, UnifiedHarnessMatrixResult } from "./unified.js";
+export { createFusionKitJudgeSynthesizer, runFusionPanels, runUnifiedHarnessE2E, setToolHarnessProvider } from "./unified.js";
+export type { CursorHarnessRunnerInput, CursorHarnessRunnerResult, FusionPanelOptions, ToolHarnessProvider, ToolHarnessResolveOptions, UnifiedHarnessE2EOptions, UnifiedHarnessE2EResult, UnifiedHarnessKind, UnifiedHarnessMatrixResult } from "./unified.js";
 export { ambientTraceId, emitTrace, getTraceEmitter, newSpanId, newTraceId, TRACE_CANDIDATE_HEADER, TRACE_ID_HEADER, TRACE_PARENT_SPAN_HEADER, TRACE_SPAN_HEADER, TraceEmitter } from "./trace.js";
 export type { EmitInput, FusionTraceComponent, FusionTraceEvent, FusionTraceEventType } from "./trace.js";
 export { runJudgeSynthesis } from "./synthesis.js";
@@ -27,4 +23,5 @@ export type { FusionKitToolExecutionBatch, FusionKitToolExecutionRequest, Fusion
 export type { CandidateCommandIsolationInput, CandidateCommandIsolationResult } from "./isolation.js";
 export { cleanupCandidateWorktree, cleanupWorktreePlan, createWorktreePlan, defaultOutputRoot, diffCandidateWorktree, sealCandidateWorktree } from "./worktree.js";
 export type { CandidateWorktree, WorktreePlan } from "./worktree.js";
+export { hardeningToJson } from "./harness.js";
 export type { EnsembleCandidateSummary, EnsembleDescriptor, EnsembleJudge, EnsembleModel, EnsemblePolicy, EnsembleRunResult, EnsembleRuntime, CandidateContainerDriver, CandidateContainerDriverInput, CandidateContainerDriverResult, CandidateHardeningMetadata, CandidateIsolationConfig, CandidateIsolationKind, CandidateIsolationMountPolicy, CandidateIsolationNetworkPolicy, CandidateIsolationSecretPolicy, HarnessAdapter, HarnessArtifact, HarnessCapabilities, HarnessCandidateOutput, HarnessCollectInput, HarnessPrepareInput, HarnessRunInput, HarnessToolRecord, ReviewEvidence, EnsembleRunSummary, VerificationProfile } from "./harness.js";

package/dist/index.js CHANGED Viewed

@@ -1,11 +1,9 @@
 export { createCommandHarness } from "./command.js";
-export { claudeCodeHarness, claudeCodeHarnessCredentialSkipReason, createClaudeCodeHarness } from "./claude-code.js";
-export { codexConfigToml, codexHarnessCredentialSkipReason, codexHarness, createCodexHarness } from "./codex.js";
+export { resolveCursorkitCli } from "./cursorkit-path.js";
 export { createArtifactStore } from "./artifacts.js";
-export { createHarnessCapabilityMatrix, harnessDashboard, runHarnessSmokeDashboard } from "./dashboard.js";
 export { createMockJudgeSynthesizer } from "./judge.js";
 export { ensemble, runEnsemble } from "./run.js";
-export { createFusionKitJudgeSynthesizer, runFusionPanels, runUnifiedHarnessE2E } from "./unified.js";
+export { createFusionKitJudgeSynthesizer, runFusionPanels, runUnifiedHarnessE2E, setToolHarnessProvider } from "./unified.js";
 export { ambientTraceId, emitTrace, getTraceEmitter, newSpanId, newTraceId, TRACE_CANDIDATE_HEADER, TRACE_ID_HEADER, TRACE_PARENT_SPAN_HEADER, TRACE_SPAN_HEADER, TraceEmitter } from "./trace.js";
 export { runJudgeSynthesis } from "./synthesis.js";
 export { createMockHarness } from "./mock.js";
@@ -13,3 +11,4 @@ export { createToolExecutor, registerDemoTools, sideEffectsForTool } from "./too
 export { executeFusionKitToolBatch, FusionKitToolExecutorClient, FusionKitToolExecutorClientError, FusionKitToolExecutorError, startFusionKitToolExecutorServer } from "./external-executor.js";
 export { createCliContainerDriver, runCandidateCommandWithIsolation, secretAbsenceMetadata, secretValueHash } from "./isolation.js";
 export { cleanupCandidateWorktree, cleanupWorktreePlan, createWorktreePlan, defaultOutputRoot, diffCandidateWorktree, sealCandidateWorktree } from "./worktree.js";
+export { hardeningToJson } from "./harness.js";

package/dist/run.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { assertHarnessCandidateRecordV1, assertHarnessRunRequestV1, assertHarnessRunResultV1, MODEL_FUSION_SCHEMA_BUNDLE_HASH, requestHash } from "@fusionkit/protocol";
 import { createArtifactStore } from "./artifacts.js";
+import { hardeningToJson } from "./harness.js";
 import { runJudgeSynthesis } from "./synthesis.js";
 import { cleanupWorktreePlan, createWorktreePlan, defaultOutputRoot, diffCandidateWorktree, sealCandidateWorktree } from "./worktree.js";
 const PRODUCER_GIT_SHA = "0".repeat(40);
@@ -99,7 +100,7 @@ function candidateMetadata(output, descriptor, worktree) {
     }
     Object.assign(metadata, output.metadata ?? {});
     if (metadata.hardening === undefined) {
-        metadata.hardening = fallbackCandidateHardening(descriptor);
+        metadata.hardening = hardeningToJson(fallbackCandidateHardening(descriptor));
     }
     if (descriptor.reviewEvidence !== undefined) {
         metadata.review_evidence_attached = true;

package/dist/test/ensemble.test.js CHANGED Viewed

@@ -5,9 +5,7 @@ import { join } from "node:path";
 import { test } from "node:test";
 import { assertJudgeSynthesisRecordV1, assertHarnessCandidateRecordV1, assertHarnessRunRequestV1, assertHarnessRunResultV1, MODEL_FUSION_SCHEMA_BUNDLE_HASH, requestHash, responseHash } from "@fusionkit/protocol";
 import { gitText } from "@fusionkit/workspace";
-import { claudeCodeHarness, claudeCodeHarnessCredentialSkipReason } from "../claude-code.js";
 import { createCommandHarness } from "../command.js";
-import { codexConfigToml, codexHarness, codexHarnessCredentialSkipReason } from "../codex.js";
 import { createMockJudgeSynthesizer } from "../judge.js";
 import { createMockHarness } from "../mock.js";
 import { runEnsemble } from "../run.js";
@@ -88,10 +86,6 @@ function addFilePatch(path, content) {
         ""
     ].join("\n");
 }
-function emptyCodexHome() {
-    const path = mkdtempSync(join(tmpdir(), "ensemble-codex-empty-home-"));
-    return { path, cleanup: () => rmSync(path, { recursive: true, force: true }) };
-}
 test("mock adapter runs N candidates and emits valid model-fusion records", async () => {
     const result = await runEnsemble(descriptor({
         harness: createMockHarness({
@@ -128,227 +122,6 @@ test("command adapter records command output, artifact, tool record, and verific
         "exec_ensemble_test_command_0"
     ]);
 });
-test("claude-code adapter can replace mock and skip clearly without credentials", async () => {
-    const result = await runEnsemble(descriptor({
-        models: [{ id: "claude", model: "claude-sonnet-4-6" }],
-        harness: claudeCodeHarness({ env: {} })
-    }));
-    assert.equal(result.candidates.length, 1);
-    assert.equal(result.harnessRunResult.status, "skipped");
-    assert.equal(result.candidates[0]?.status, "skipped");
-    assert.equal(result.candidates[0]?.error?.kind, "capability_missing");
-    assert.match(result.candidates[0]?.error?.message ?? "", /missing Claude Code credential/);
-    assert.match(result.summary?.candidates[0]?.verification?.evidence[0] ?? "", /missing Claude/);
-});
-test("claude-code adapter delegates through a session backend from a generic descriptor", async () => {
-    const repo = makeRepo();
-    const seen = {};
-    const backend = {
-        isolation: "vercel-sandbox",
-        supports: () => true,
-        execute: async (input) => {
-            seen.agentKind = input.contract.agent.kind;
-            seen.env = input.execution.env;
-            seen.repoDir = input.repoDir;
-            assert.equal(input.contract.isolation, "vercel-sandbox");
-            assert.equal(input.contract.execution?.kind, "agent");
-            assert.equal(input.secrets.length, 0);
-            writeFileSync(join(input.repoDir, "CLAUDE_RESULT.md"), "fake claude result\n");
-            input.emit({
-                type: "command.executed",
-                argvHash: requestHash({ adapter: "claude-code" }),
-                exitCode: 0
-            });
-            return { exitCode: 0, log: Buffer.from("fake claude transcript") };
-        }
-    };
-    try {
-        const result = await runEnsemble(descriptor({
-            models: [{ id: "claude", model: "claude-sonnet-4-6" }],
-            harness: claudeCodeHarness({
-                env: {
-                    ANTHROPIC_API_KEY: "sk-ant-test",
-                    VERCEL_TOKEN: "vercel-test"
-                },
-                backend
-            }),
-            workspace: repo.repo,
-            baseGitSha: repo.head,
-            outputRoot: repo.outputRoot,
-            cleanupWorktrees: true
-        }));
-        assert.equal(result.harnessRunResult.status, "succeeded");
-        assert.equal(result.candidates[0]?.status, "succeeded");
-        assert.equal(seen.agentKind, "claude-code");
-        assert.equal(seen.env?.ANTHROPIC_API_KEY, "sk-ant-test");
-        assert.equal(Object.hasOwn(seen.env ?? {}, "VERCEL_TOKEN"), false);
-        assert.notEqual(seen.repoDir, repo.repo);
-        assert.ok(result.artifacts.some((artifact) => artifact.kind === "patch"));
-        assert.match(result.candidates[0]?.metadata?.adapter, /claude-code/);
-    }
-    finally {
-        repo.cleanup();
-    }
-});
-test("smoke: claude-code adapter runs live when credentials are available", { skip: liveClaudeSmokeSkipReason() }, async () => {
-    const repo = makeRepo();
-    try {
-        const result = await runEnsemble(descriptor({
-            id: "claude_smoke",
-            models: [{ id: "claude", model: "claude-sonnet-4-6" }],
-            harness: claudeCodeHarness(),
-            runtime: {
-                id: "vercel-sandbox",
-                isolation: {
-                    kind: "microvm",
-                    networkPolicy: {
-                        defaultDeny: true,
-                        allowHosts: [
-                            "registry.npmjs.org",
-                            "api.anthropic.com",
-                            "ai-gateway.vercel.sh"
-                        ]
-                    }
-                }
-            },
-            policy: {
-                id: "claude-smoke-policy",
-                allowedTools: ["read_file"],
-                sideEffects: "read_only",
-                timeoutMs: 180_000
-            },
-            prompt: "Read README.md if present, then reply exactly CLAUDE_LIVE_SMOKE_OK. Do not modify files.",
-            workspace: repo.repo,
-            baseGitSha: repo.head,
-            outputRoot: repo.outputRoot,
-            cleanupWorktrees: true
-        }));
-        assertHarnessRunResultV1(result.harnessRunResult);
-        assert.equal(result.harnessRunResult.status, "succeeded");
-        assert.equal(result.candidates[0]?.status, "succeeded");
-    }
-    finally {
-        repo.cleanup();
-    }
-});
-test("codex config declares a Responses provider without touching Cursor records", () => {
-    const toml = codexConfigToml({
-        model: "gpt-5.5-codex",
-        sandboxMode: "workspace-write",
-        approvalPolicy: "never",
-        provider: {
-            providerId: "warrant-local",
-            name: "Warrant Local",
-            baseUrl: "https://gateway.example.com/v1/responses",
-            apiKeyEnvName: "WARRANT_CODEX_API_KEY",
-            requiresOpenAiAuth: true
-        }
-    });
-    assert.match(toml, /model = "gpt-5\.5-codex"/);
-    assert.match(toml, /model_provider = "warrant-local"/);
-    assert.match(toml, /\[model_providers\.warrant-local\]/);
-    assert.match(toml, /base_url = "https:\/\/gateway\.example\.com\/v1"/);
-    assert.match(toml, /wire_api = "responses"/);
-    assert.match(toml, /env_key = "WARRANT_CODEX_API_KEY"/);
-    assert.equal(toml.includes("cursor"), false);
-});
-test("codex adapter emits schema-valid skipped output without credentials", async () => {
-    const codexHome = emptyCodexHome();
-    try {
-        const result = await runEnsemble(descriptor({
-            models: [{ id: "codex", model: "gpt-5.5-codex" }],
-            harness: codexHarness({
-                env: { CODEX_HOME: codexHome.path },
-                provider: { kind: "ambient" }
-            })
-        }));
-        assertHarnessRunResultV1(result.harnessRunResult);
-        assert.equal(result.harnessRunResult.status, "skipped");
-        assert.equal(result.candidates[0]?.status, "skipped");
-        assert.equal(result.candidates[0]?.error?.kind, "capability_missing");
-        assert.match(result.candidates[0]?.error?.message ?? "", /Codex credentials are absent/);
-        assert.match(result.summary?.candidates[0]?.verification?.evidence[0] ?? "", /Codex credentials/);
-    }
-    finally {
-        codexHome.cleanup();
-    }
-});
-test("codex adapter runs through an injected Responses runner and records evidence", async () => {
-    const calls = [];
-    const result = await runEnsemble(descriptor({
-        models: [{ id: "codex", model: "gpt-5.5-codex" }],
-        harness: codexHarness({
-            env: {},
-            provider: {
-                kind: "responses",
-                baseUrl: "http://127.0.0.1:8787/v1/responses",
-                apiKey: "inline-test-key",
-                requiresOpenAiAuth: true,
-                providerId: "local-responses"
-            },
-            runner: (input) => {
-                calls.push(input);
-                const codexHome = input.env.CODEX_HOME;
-                assert.ok(codexHome);
-                const config = readFileSync(join(codexHome, "config.toml"), "utf8");
-                assert.match(config, /model_provider = "local-responses"/);
-                assert.match(config, /base_url = "http:\/\/127\.0\.0\.1:8787\/v1"/);
-                assert.match(config, /wire_api = "responses"/);
-                assert.match(config, /env_key = "WARRANT_CODEX_PROVIDER_API_KEY"/);
-                assert.equal(input.env.WARRANT_CODEX_PROVIDER_API_KEY, "inline-test-key");
-                return {
-                    stdout: '{"type":"message","content":"codex-ok"}\n',
-                    stderr: "",
-                    exitCode: 0
-                };
-            }
-        })
-    }));
-    assert.equal(calls.length, 1);
-    assert.deepEqual(calls[0]?.args.slice(0, 3), [
-        "exec",
-        "--json",
-        "--skip-git-repo-check"
-    ]);
-    assert.equal(result.harnessRunResult.status, "succeeded");
-    assert.equal(result.candidates[0]?.status, "succeeded");
-    assert.equal(result.toolRecords[0]?.status, "succeeded");
-    assert.match(result.candidates[0]?.metadata?.adapter, /codex/);
-});
-function liveClaudeSmokeSkipReason() {
-    if (process.env.WARRANT_CLAUDE_SMOKE !== "1") {
-        return "set WARRANT_CLAUDE_SMOKE=1 plus Claude Code credentials to run the live Claude Code smoke";
-    }
-    return claudeCodeHarnessCredentialSkipReason() ?? false;
-}
-function liveCodexSmokeSkipReason() {
-    if (process.env.WARRANT_CODEX_SMOKE !== "1") {
-        return "set WARRANT_CODEX_SMOKE=1 plus Codex credentials to run the live Codex smoke";
-    }
-    return codexHarnessCredentialSkipReason() ?? false;
-}
-test("codex adapter live smoke is credential-gated", { skip: liveCodexSmokeSkipReason() }, async () => {
-    const repo = makeRepo();
-    try {
-        const result = await runEnsemble(descriptor({
-            prompt: "Read README.md if present, then reply exactly CODEX_LIVE_SMOKE_OK. Do not modify files.",
-            models: [{ id: "codex", model: process.env.WARRANT_CODEX_SMOKE_MODEL ?? "gpt-5.5-codex" }],
-            harness: codexHarness({
-                timeoutMs: 60_000,
-                sandboxMode: "read-only",
-                approvalPolicy: "never"
-            }),
-            workspace: repo.repo,
-            baseGitSha: repo.head,
-            outputRoot: repo.outputRoot
-        }));
-        assertHarnessRunResultV1(result.harnessRunResult);
-        assert.notEqual(result.harnessRunResult.status, "skipped");
-    }
-    finally {
-        repo.cleanup();
-    }
-});
 test("command adapter records optional container hardening metadata", async () => {
     const driver = {
         id: "fake-ensemble-container",

package/dist/unified.d.ts CHANGED Viewed

@@ -1,7 +1,33 @@
 import type { JsonValue, ModelFusionStatus } from "@fusionkit/protocol";
-import type { EnsembleModel, EnsembleRunResult } from "./harness.js";
+import type { EnsembleDescriptor, EnsembleModel, EnsembleRunResult, HarnessAdapter } from "./harness.js";
 import type { JudgeSynthesizer } from "./judge.js";
 export type UnifiedHarnessKind = "mock" | "command" | "agent" | "codex" | "claude-code" | "cursor-acp" | "cursor-desktop";
+/**
+ * Options the unified runner passes to a tool's harness factory. The per-tool
+ * packages map these onto their own harness options (provider base URL, etc.).
+ */
+export type ToolHarnessResolveOptions = {
+    fusionBackendUrl: string;
+    fusionApiKey?: string;
+    timeoutMs?: number;
+};
+/**
+ * Provides everything ensemble needs about a tool-backed harness kind (codex,
+ * claude-code, cursor-*) without ensemble depending on any per-tool package. The
+ * fusionkit CLI registers one (built from its tool registry) via
+ * {@link setToolHarnessProvider}; without it, requesting a tool harness kind
+ * throws a clear error.
+ */
+export type ToolHarnessProvider = {
+    adapter(kind: UnifiedHarnessKind, options: ToolHarnessResolveOptions): HarnessAdapter;
+    sideEffects(kind: UnifiedHarnessKind): EnsembleDescriptor["policy"]["sideEffects"];
+    responseShape(kind: UnifiedHarnessKind): string;
+};
+/**
+ * Register the provider that resolves tool-backed harness kinds. The fusionkit
+ * CLI wires this at startup from its tool registry.
+ */
+export declare function setToolHarnessProvider(provider: ToolHarnessProvider | undefined): void;
 export type UnifiedHarnessMatrixResult = {
     harness: UnifiedHarnessKind;
     modelIds: string[];
@@ -26,7 +52,6 @@ export type CursorHarnessRunnerInput = {
     repo: string;
     outDir: string;
     timeoutMs?: number;
-    cursorKitDir?: string;
 };
 export type CursorHarnessRunnerResult = {
     status: ModelFusionStatus;
@@ -46,7 +71,6 @@ export type UnifiedHarnessE2EOptions = {
     command?: string;
     timeoutMs?: number;
     judgeModel?: string;
-    cursorKitDir?: string;
     cursorRunner?: (input: CursorHarnessRunnerInput) => Promise<CursorHarnessRunnerResult>;
     /**
      * Per-candidate model backend URLs keyed by `EnsembleModel.id`. When a

package/dist/unified.js CHANGED Viewed

@@ -4,11 +4,32 @@ import { join, resolve } from "node:path";
 import { newSpanId, TRACE_ID_HEADER, TRACE_SPAN_HEADER } from "@fusionkit/protocol";
 import { gitText } from "@fusionkit/workspace";
 import { createAgentHarness } from "./agent.js";
-import { claudeCodeHarness } from "./claude-code.js";
 import { createCommandHarness } from "./command.js";
-import { codexHarness } from "./codex.js";
+import { resolveCursorkitCli } from "./cursorkit-path.js";
 import { createMockHarness } from "./mock.js";
 import { runEnsemble } from "./run.js";
+let toolHarnessProvider;
+/**
+ * Register the provider that resolves tool-backed harness kinds. The fusionkit
+ * CLI wires this at startup from its tool registry.
+ */
+export function setToolHarnessProvider(provider) {
+    toolHarnessProvider = provider;
+}
+function requireToolHarnessProvider(kind) {
+    if (toolHarnessProvider === undefined) {
+        throw new Error(`no tool harness provider registered for harness kind "${kind}"; ` +
+            "the fusionkit CLI wires this via setToolHarnessProvider (build the tool registry first).");
+    }
+    return toolHarnessProvider;
+}
+function resolveToolAdapter(kind, options) {
+    return requireToolHarnessProvider(kind).adapter(kind, {
+        fusionBackendUrl: normalizeFusionBackendUrl(options.fusionBackendUrl),
+        ...(options.fusionApiKey !== undefined ? { fusionApiKey: options.fusionApiKey } : {}),
+        ...(options.timeoutMs !== undefined ? { timeoutMs: options.timeoutMs } : {})
+    });
+}
 function normalizeFusionBackendUrl(value) {
     return value.replace(/\/+$/, "");
 }
@@ -30,7 +51,7 @@ function sideEffectsForHarness(kind) {
         case "claude-code":
         case "cursor-acp":
         case "cursor-desktop":
-            return "writes_workspace";
+            return requireToolHarnessProvider(kind).sideEffects(kind);
         default: {
             const exhausted = kind;
             throw new Error(`unsupported unified harness: ${String(exhausted)}`);
@@ -72,19 +93,10 @@ function harnessAdapter(kind, options) {
             });
         }
         case "codex":
-            return codexHarness({
-                timeoutMs: options.timeoutMs,
-                provider: {
-                    kind: "openai-compatible",
-                    baseUrl: normalizeFusionBackendUrl(options.fusionBackendUrl),
-                    ...(options.fusionApiKey ? { apiKey: options.fusionApiKey } : {})
-                }
-            });
         case "claude-code":
-            return claudeCodeHarness({ timeoutMs: options.timeoutMs });
         case "cursor-acp":
         case "cursor-desktop":
-            throw new Error(`${kind} runs through the Cursor harness adapter path`);
+            return resolveToolAdapter(kind, options);
         default: {
             const exhausted = kind;
             throw new Error(`unsupported unified harness: ${String(exhausted)}`);
@@ -100,12 +112,10 @@ function responseShapeFor(kind) {
             return ("Respond to the user in the natural shape the request calls for: a direct answer, " +
                 "a plan, or the concrete code change. Reply in first person as the assistant.");
         case "codex":
-            return "Return a Codex-style result summary with patch and verification evidence.";
         case "claude-code":
-            return "Return a Claude Code-style transcript summary with patch/worktree evidence.";
         case "cursor-acp":
         case "cursor-desktop":
-            return "Return text suitable for Cursor ACP session/update plus route evidence notes.";
+            return requireToolHarnessProvider(kind).responseShape(kind);
         default: {
             const exhausted = kind;
             throw new Error(`unsupported unified harness: ${String(exhausted)}`);
@@ -304,17 +314,10 @@ function statusForResult(result) {
     return result.failureSummary ? "failed" : result.harnessRunResult.status;
 }
 async function defaultCursorRunner(input) {
-    if (!input.cursorKitDir) {
-        return {
-            status: "skipped",
-            message: "Cursorkit directory not configured",
-            details: { reason: "cursor_kit_dir_missing" }
-        };
-    }
+    const { harnessCli } = resolveCursorkitCli();
     const suite = input.kind === "cursor-acp" ? "acp" : "desktop-route";
     const args = [
-        "test:harness",
-        "--",
+        harnessCli,
         "--suite",
         suite,
         "--base-url",
@@ -328,8 +331,8 @@ async function defaultCursorRunner(input) {
     ];
     mkdirSync(input.outDir, { recursive: true });
     return await new Promise((resolveResult) => {
-        const child = spawn("pnpm", args, {
-            cwd: input.cursorKitDir,
+        const child = spawn(process.execPath, args, {
+            cwd: input.outDir,
             stdio: ["ignore", "pipe", "pipe"]
         });
         let stdout = "";
@@ -360,8 +363,7 @@ async function runCursorHarness(kind, options) {
         fusionBackendUrl: options.fusionBackendUrl,
         repo: options.repo,
         outDir: join(options.outputRoot, `${kind}-${model.id}`),
-        timeoutMs: options.timeoutMs,
-        cursorKitDir: options.cursorKitDir
+        timeoutMs: options.timeoutMs
     })));
     const failed = perModel.find((result) => result.status === "failed");
     const skipped = perModel.every((result) => result.status === "skipped");
@@ -385,7 +387,10 @@ export async function runUnifiedHarnessE2E(options) {
     mkdirSync(outputRoot, { recursive: true });
     const results = [];
     for (const kind of options.harnesses) {
-        if (kind === "cursor-acp" || kind === "cursor-desktop") {
+        if ((kind === "cursor-acp" || kind === "cursor-desktop") &&
+            options.cursorRunner !== undefined) {
+            // Explicit probe runner: drive the Cursorkit harness suite and record a
+            // route/transcript probe instead of producing real ensemble candidates.
             results.push(await runCursorHarness(kind, options));
             continue;
         }

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@fusionkit/ensemble",
   "private": false,
-  "version": "0.1.4",
+  "version": "0.1.6",
   "repository": {
     "type": "git",
     "url": "git+https://github.com/velum-labs/handoffkit.git",
@@ -25,11 +25,12 @@
     "provenance": true
   },
   "dependencies": {
-    "@fusionkit/adapter-ai-sdk": "0.1.4",
-    "@fusionkit/model-gateway": "0.1.4",
-    "@fusionkit/protocol": "0.1.4",
-    "@fusionkit/runner": "0.1.4",
-    "@fusionkit/session-harness": "0.1.4",
-    "@fusionkit/workspace": "0.1.4"
+    "@velum-labs/cursorkit": "0.1.2",
+    "@fusionkit/adapter-ai-sdk": "0.1.6",
+    "@fusionkit/model-gateway": "0.1.6",
+    "@fusionkit/protocol": "0.1.6",
+    "@fusionkit/session-harness": "0.1.6",
+    "@fusionkit/runner": "0.1.6",
+    "@fusionkit/workspace": "0.1.6"
   }
 }

package/dist/claude-code.d.ts DELETED Viewed

@@ -1,25 +0,0 @@
-import type { NetworkPolicy } from "@fusionkit/protocol";
-import type { SessionBackend } from "@fusionkit/runner";
-import type { ClaudeCodeBindingOptions } from "@fusionkit/session-harness";
-import type { HarnessAdapter } from "./harness.js";
-export type ClaudeCodeHarnessEnv = Record<string, string | undefined>;
-export type ClaudeCodeHarnessOptions = ClaudeCodeBindingOptions & {
-    id?: string;
-    /** Defaults to `process.env`; tests can pass `{}` for deterministic skips. */
-    env?: ClaudeCodeHarnessEnv;
-    /** Already-released secret values forwarded through the session backend seam. */
-    secrets?: {
-        name: string;
-        value: string;
-    }[];
-    /** Test/extension seam. Defaults to `aiSdkHarnessBackend(...)`. */
-    backend?: SessionBackend;
-    pool?: string;
-    network?: NetworkPolicy;
-    timeoutMs?: number;
-    logMaxBytes?: number;
-    skipWhenUnavailable?: boolean;
-};
-export declare function claudeCodeHarnessCredentialSkipReason(env?: ClaudeCodeHarnessEnv, options?: ClaudeCodeHarnessOptions): string | undefined;
-export declare function createClaudeCodeHarness(options?: ClaudeCodeHarnessOptions): HarnessAdapter;
-export declare function claudeCodeHarness(options?: ClaudeCodeHarnessOptions): HarnessAdapter;