npm - @botbotgo/agent-harness - Versions diffs - 0.0.91 → 0.0.93 - Mend

@botbotgo/agent-harness 0.0.91 → 0.0.93

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (39)

package/README.md +138 -31
package/README.zh.md +93 -28
package/dist/benchmark/upstream-runtime-ab-benchmark.d.ts +1 -1
package/dist/benchmark/upstream-runtime-ab-benchmark.js +2 -1
package/dist/config/workflows/langgraph-workflows.yaml +292 -0
package/dist/contracts/types.d.ts +8 -3
package/dist/init-project.js +7 -7
package/dist/package-version.d.ts +1 -1
package/dist/package-version.js +1 -1
package/dist/runtime/agent-runtime-adapter.d.ts +48 -1
package/dist/runtime/agent-runtime-adapter.js +1001 -50
package/dist/runtime/harness.d.ts +2 -0
package/dist/runtime/harness.js +55 -11
package/dist/runtime/inventory.d.ts +1 -1
package/dist/runtime/inventory.js +1 -1
package/dist/runtime/langgraph-presets.d.ts +23 -0
package/dist/runtime/langgraph-presets.js +165 -0
package/dist/runtime/policy-engine.js +0 -5
package/dist/runtime/support/compiled-binding.d.ts +4 -1
package/dist/runtime/support/compiled-binding.js +24 -2
package/dist/runtime/support/harness-support.js +3 -3
package/dist/runtime/support/runtime-entry.js +1 -1
package/dist/workspace/agent-binding-compiler.js +82 -8
package/dist/workspace/compile.js +1 -3
package/dist/workspace/object-loader.js +47 -6
package/dist/workspace/support/agent-capabilities.js +2 -2
package/dist/workspace/support/workspace-ref-utils.d.ts +2 -1
package/dist/workspace/support/workspace-ref-utils.js +21 -0
package/dist/workspace/validate.js +1 -1
package/package.json +2 -2
/package/dist/config/{backends.yaml → catalogs/backends.yaml} +0 -0
/package/dist/config/{embedding-models.yaml → catalogs/embedding-models.yaml} +0 -0
/package/dist/config/{mcp.yaml → catalogs/mcp.yaml} +0 -0
/package/dist/config/{models.yaml → catalogs/models.yaml} +0 -0
/package/dist/config/{stores.yaml → catalogs/stores.yaml} +0 -0
/package/dist/config/{tools.yaml → catalogs/tools.yaml} +0 -0
/package/dist/config/{vector-stores.yaml → catalogs/vector-stores.yaml} +0 -0
/package/dist/config/{runtime-memory.yaml → runtime/runtime-memory.yaml} +0 -0
/package/dist/config/{workspace.yaml → runtime/workspace.yaml} +0 -0

package/dist/config/workflows/langgraph-workflows.yaml ADDED Viewed

@@ -0,0 +1,292 @@
+# agent-harness feature: schema version for this declarative config object.
+apiVersion: agent-harness/v1alpha1
+# agent-harness feature: catalog of reusable LangGraph-shaped workflow resources.
+kind: LangGraphWorkflows
+spec:
+  - id: default
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise plan for the user request
+          before execution starts.
+      - id: executor
+        kind: executor
+      - id: reviewer
+        kind: reviewer
+        prompt: >-
+          Review the current result, call out missing verification or obvious gaps,
+          and state whether the work looks sufficient.
+      - id: replanner
+        kind: replanner
+        prompt: >-
+          Refine the plan based on the reviewer feedback and current result.
+          Return only the updated plan.
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: executor
+      - from: executor
+        to: reviewer
+        when: has_result
+      - from: reviewer
+        to: finalizer
+        when: review_ok
+      - from: reviewer
+        to: replanner
+        when: review_incomplete
+      - from: replanner
+        to: executor
+        when: has_plan
+  - id: react
+    entryNode: executor
+    nodes:
+      - id: executor
+        kind: executor
+    edges: []
+  - id: prompt-chaining
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise execution plan for the user request
+          before execution starts.
+      - id: executor
+        kind: executor
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: executor
+      - from: executor
+        to: finalizer
+        when: has_result
+  - id: routing
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise execution plan for the user request
+          before execution starts.
+      - id: specialist
+        kind: specialist
+        specialist: specialist
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: specialist
+      - from: specialist
+        to: finalizer
+        when: has_result
+  - id: parallelization
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise execution plan for the user request
+          before execution starts.
+      - id: specialist
+        kind: specialist
+        specialist: specialist
+      - id: reviewer
+        kind: reviewer
+        prompt: >-
+          Review the current result, call out missing verification or obvious gaps,
+          and state whether the work looks sufficient.
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: specialist
+      - from: specialist
+        to: reviewer
+        when: has_result
+      - from: reviewer
+        to: finalizer
+        when: review_ok
+  - id: plan-execute
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise execution plan for the user request
+          before execution starts.
+      - id: executor
+        kind: executor
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: executor
+      - from: executor
+        to: finalizer
+        when: has_result
+  - id: review-loop
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise plan for the user request
+          before execution starts.
+      - id: executor
+        kind: executor
+      - id: reviewer
+        kind: reviewer
+        prompt: >-
+          Review the current result, call out missing verification or obvious gaps,
+          and state whether the work looks sufficient.
+      - id: replanner
+        kind: replanner
+        prompt: >-
+          Refine the plan based on the reviewer feedback and current result.
+          Return only the updated plan.
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: executor
+      - from: executor
+        to: reviewer
+        when: has_result
+      - from: reviewer
+        to: finalizer
+        when: review_ok
+      - from: reviewer
+        to: replanner
+        when: review_incomplete
+      - from: replanner
+        to: executor
+        when: has_plan
+  - id: evaluator-optimizer
+    entryNode: executor
+    nodes:
+      - id: executor
+        kind: executor
+      - id: reviewer
+        kind: reviewer
+        prompt: >-
+          Review the current result, call out missing verification or obvious gaps,
+          and state whether the work looks sufficient.
+      - id: replanner
+        kind: replanner
+        prompt: >-
+          Refine the plan based on the reviewer feedback and current result.
+          Return only the updated plan.
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: executor
+        to: reviewer
+        when: has_result
+      - from: reviewer
+        to: finalizer
+        when: review_ok
+      - from: reviewer
+        to: replanner
+        when: review_incomplete
+      - from: replanner
+        to: executor
+        when: has_plan
+  - id: approval-gate
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise execution plan for the user request
+          before execution starts.
+      - id: approval
+        kind: approval
+      - id: executor
+        kind: executor
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: approval
+      - from: approval
+        to: executor
+        when: approval_approved
+      - from: approval
+        to: executor
+        when: approval_edited
+      - from: executor
+        to: finalizer
+        when: has_result
+  - id: handoff
+    entryNode: specialist
+    nodes:
+      - id: specialist
+        kind: specialist
+        specialist: specialist
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: specialist
+        to: finalizer
+        when: has_result
+  - id: orchestrator-workers
+    entryNode: planner
+    nodes:
+      - id: planner
+        kind: planner
+        prompt: >-
+          You are the workflow planner. Produce a concise plan for the user request
+          before execution starts.
+      - id: specialist
+        kind: specialist
+        specialist: specialist
+      - id: reviewer
+        kind: reviewer
+        prompt: >-
+          Review the current result, call out missing verification or obvious gaps,
+          and state whether the work looks sufficient.
+      - id: finalizer
+        kind: finalizer
+        prompt: >-
+          Rewrite the current result into a concise user-facing final answer.
+          Preserve facts and caveats.
+    edges:
+      - from: planner
+        to: specialist
+      - from: specialist
+        to: reviewer
+        when: has_result
+      - from: reviewer
+        to: finalizer
+        when: review_ok

package/dist/contracts/types.d.ts CHANGED Viewed

@@ -1,5 +1,8 @@
-export type ExecutionMode = "deepagent" | "langchain-v1";
+export type ExecutionMode = "deepagent" | "langchain-v1" | "langgraph";
 export declare const AUTO_AGENT_ID = "auto";
+export type RuntimeModelSlot = "routing" | "planning" | "execution" | "review" | "final";
+export type RuntimeModelRefMap = Partial<Record<RuntimeModelSlot, string>>;
+export type RuntimeModelMap = Partial<Record<RuntimeModelSlot, CompiledModel>>;
 export type RuntimeCapabilities = {
     delegation?: boolean;
     memory?: boolean;
@@ -8,6 +11,7 @@ export type RunState = "queued" | "claimed" | "running" | "waiting_for_approval"
 export type ParsedAgentObject = {
     id: string;
     executionMode: ExecutionMode;
+    runtimeModelRefs?: RuntimeModelRefMap;
     capabilities?: RuntimeCapabilities;
     description: string;
     modelRef: string;
@@ -200,7 +204,8 @@ export type CompiledAgentBinding = {
     harnessRuntime: {
         runRoot: string;
         workspaceRoot?: string;
-        runtimeEntry: boolean;
+        modelRefs?: RuntimeModelRefMap;
+        models?: RuntimeModelMap;
         capabilities?: RuntimeCapabilities;
         resilience?: Record<string, unknown>;
         checkpointer?: Record<string, unknown> | boolean;
@@ -239,7 +244,7 @@ export type ThreadSummary = {
     status: RunState;
 };
 export type SessionRecord = ThreadSummary;
-export type KnownHarnessEventType = "run.created" | "run.queued" | "run.dequeued" | "run.state.changed" | "run.resumed" | "approval.requested" | "approval.resolved" | "artifact.created" | "output.delta" | "reasoning.delta" | "runtime.health.changed" | "runtime.synthetic_fallback";
+export type KnownHarnessEventType = "run.created" | "run.queued" | "run.dequeued" | "run.state.changed" | "run.reviewed" | "run.resumed" | "approval.requested" | "approval.resolved" | "artifact.created" | "output.delta" | "reasoning.delta" | "runtime.health.changed" | "runtime.synthetic_fallback";
 export type HarnessEventType = KnownHarnessEventType | (string & {});
 export type HarnessEvent = {
     eventId: string;

package/dist/init-project.js CHANGED Viewed

@@ -43,7 +43,7 @@ function renderPackageJson(projectSlug, template) {
 }
 function renderReadme(displayName, projectSlug, options) {
     const webSearchLine = options.withWebSearch
-        ? `- ${options.provider} native web search enabled through \`config/tools.yaml\``
+        ? `- ${options.provider} native web search enabled through \`config/catalogs/tools.yaml\``
         : "- no provider-native web search by default";
     const providerEnvLine = options.provider === "openai" ? "export OPENAI_API_KEY=your_key_here\n" : "";
     const templateLine = options.template === "deep-research"
@@ -73,7 +73,7 @@ ${providerEnvLine}npm run start -- "Research the latest model serving stack for
 ## Customize
-- change \`config/models.yaml\` to switch models or providers
+- change \`config/catalogs/models.yaml\` to switch models or providers
 - add local \`tool({...})\` tools under \`resources/tools/\`
 - add product-specific skills under \`resources/skills/\`
 - edit the prompts in \`config/agents/\` to turn this into your own product
@@ -316,12 +316,12 @@ export async function initProject(projectRoot, projectName, options = {}) {
         [".gitignore", renderGitignore()],
         ["README.md", renderReadme(displayName, projectSlug, resolved)],
         ["src/run.mjs", renderRunScript(resolved)],
-        ["config/workspace.yaml", renderWorkspaceYaml()],
+        ["config/runtime/workspace.yaml", renderWorkspaceYaml()],
         ["config/agent-context.md", renderAgentContext(resolved)],
-        ["config/models.yaml", renderModelsYaml(resolved)],
-        ["config/runtime-memory.yaml", renderRuntimeMemoryYaml()],
-        ["config/backends.yaml", renderBackendsYaml()],
-        ["config/tools.yaml", renderToolsYaml(resolved)],
+        ["config/catalogs/models.yaml", renderModelsYaml(resolved)],
+        ["config/runtime/runtime-memory.yaml", renderRuntimeMemoryYaml()],
+        ["config/catalogs/backends.yaml", renderBackendsYaml()],
+        ["config/catalogs/tools.yaml", renderToolsYaml(resolved)],
         ["config/agents/research.yaml", renderResearchAgentYaml(resolved)],
         ["resources/package.json", renderResourcePackageJson(projectSlug)],
         ["resources/skills/deep-research/SKILL.md", renderSkill(resolved)],

package/dist/package-version.d.ts CHANGED Viewed

	@@ -1 +1 @@
1	- export declare const AGENT_HARNESS_VERSION = "0.0.90";
1	+ export declare const AGENT_HARNESS_VERSION = "0.0.92";

package/dist/package-version.js CHANGED Viewed

	@@ -1 +1 @@
1	- export const AGENT_HARNESS_VERSION = "0.0.90";
1	+ export const AGENT_HARNESS_VERSION = "0.0.92";

package/dist/runtime/agent-runtime-adapter.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import type { CompiledAgentBinding, MessageContent, RunResult, RuntimeAdapterOptions, TranscriptMessage } from "../contracts/types.js";
+import type { CompiledAgentBinding, CompiledModel, CompiledSubAgent, MessageContent, RunResult, RuntimeAdapterOptions, TranscriptMessage } from "../contracts/types.js";
 import { type RuntimeStreamChunk } from "./parsing/stream-event-parsing.js";
 type RunnableLike = {
     invoke: (input: unknown, config?: Record<string, unknown>) => Promise<unknown>;
@@ -19,10 +19,16 @@ export declare function materializeDeepAgentSkillSourcePaths(options: {
     ownerId: string;
     skillPaths?: string[];
 }): Promise<string[] | undefined>;
+export declare function shouldRelaxDeepAgentDelegationPrompt(model: CompiledModel | undefined, params: {
+    subagents?: CompiledSubAgent[];
+    generalPurposeAgent?: boolean;
+    taskDescription?: string;
+}): boolean;
 export declare class AgentRuntimeAdapter {
     private readonly options;
     private readonly modelCache;
     private readonly runnableCache;
+    private readonly langGraphSessions;
     constructor(options?: RuntimeAdapterOptions);
     private getModelCacheKey;
     private resolveBindingTimeout;
@@ -56,13 +62,53 @@ export declare class AgentRuntimeAdapter {
     private resolveDeepAgentAutomaticMiddleware;
     private resolveMiddleware;
     private resolveCheckpointer;
+    private resolveLangGraphWorkflowCheckpointer;
     private buildRouteSystemPrompt;
     private resolveSubagents;
+    private createLangChainRunnable;
+    private normalizeLangGraphWorkflowNode;
+    private listLangGraphWorkflowNodes;
+    private normalizeLangGraphWorkflowEdge;
+    private listLangGraphWorkflowEdges;
+    private shouldFollowLangGraphEdge;
+    private listLangGraphWorkflowNextNodes;
+    private extractInvocationRequestText;
+    private prependSystemMessage;
+    private replaceLastUserMessage;
+    private resolveLangGraphSessionKey;
+    private resolveLangGraphSessionIdentity;
+    private langGraphCheckpointNamespace;
+    private langGraphCheckpointConfig;
+    private buildLangGraphWorkflowCheckpoint;
+    private saveLangGraphSessionToCheckpointer;
+    private loadLangGraphSessionFromCheckpointer;
+    private clearLangGraphSessionInCheckpointer;
+    private langGraphSessionFilePath;
+    private artifactLangGraphSessionFilePath;
+    private legacyLangGraphSessionFilePath;
+    private saveLangGraphSession;
+    private loadLangGraphSession;
+    private clearLangGraphSession;
+    private invokeWorkflowNodeModel;
+    private invokeLangGraphSpecialist;
+    private createLangGraphRunnable;
+    private extractExecutedToolResults;
+    private extractLangGraphResultOutput;
+    private streamLangGraphWorkflow;
     private createRunnable;
     create(binding: CompiledAgentBinding): Promise<RunnableLike>;
     route(input: MessageContent, primaryBinding: CompiledAgentBinding, secondaryBinding: CompiledAgentBinding, options?: {
         systemPrompt?: string;
     }): Promise<string>;
+    reviewRunResult(binding: CompiledAgentBinding, input: MessageContent, result: Pick<RunResult, "output" | "state" | "finalMessageText">): Promise<{
+        assessment: string;
+        modelId: string;
+    } | null>;
+    synthesizeFinalResult(binding: CompiledAgentBinding, input: MessageContent, result: Pick<RunResult, "output" | "state" | "finalMessageText">): Promise<{
+        output: string;
+        finalMessageText: string;
+        modelId: string;
+    } | null>;
     invoke(binding: CompiledAgentBinding, input: MessageContent, threadId: string, runId: string, resumePayload?: unknown, history?: TranscriptMessage[], options?: {
         context?: Record<string, unknown>;
         state?: Record<string, unknown>;
@@ -72,6 +118,7 @@ export declare class AgentRuntimeAdapter {
         context?: Record<string, unknown>;
         state?: Record<string, unknown>;
         files?: Record<string, unknown>;
+        runId?: string;
     }): AsyncGenerator<RuntimeStreamChunk | string>;
 }
 export { AgentRuntimeAdapter as RuntimeAdapter, AGENT_INTERRUPT_SENTINEL_PREFIX, AGENT_INTERRUPT_SENTINEL_PREFIX as INTERRUPT_SENTINEL_PREFIX, RuntimeOperationTimeoutError, };