npm - @tangle-network/agent-runtime - Versions diffs - 0.40.0 → 0.42.0 - Mend

@tangle-network/agent-runtime 0.40.0 → 0.42.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44) hide show

package/dist/agent.d.ts +57 -2
package/dist/agent.js +54 -0
package/dist/agent.js.map +1 -1
package/dist/chunk-7JITYN6T.js +72 -0
package/dist/chunk-7JITYN6T.js.map +1 -0
package/dist/{chunk-3WQJRSUJ.js → chunk-BDGYYO7K.js} +3 -3
package/dist/{chunk-6HI3QUJD.js → chunk-HCL2ZG5L.js} +51 -5
package/dist/chunk-HCL2ZG5L.js.map +1 -0
package/dist/{chunk-HSX6PFZR.js → chunk-HVYOHJHK.js} +338 -2
package/dist/chunk-HVYOHJHK.js.map +1 -0
package/dist/{chunk-OISRXLWI.js → chunk-IFG6GX6A.js} +64 -40
package/dist/chunk-IFG6GX6A.js.map +1 -0
package/dist/chunk-NRZOXCJK.js +64 -0
package/dist/chunk-NRZOXCJK.js.map +1 -0
package/dist/{chunk-VFKBIZTY.js → chunk-WMBYQPYM.js} +5 -4
package/dist/chunk-WMBYQPYM.js.map +1 -0
package/dist/delegation-profile-1GbW5yA3.d.ts +73 -0
package/dist/{dynamic-BT9Ji3jE.d.ts → dynamic-B_7GgCwu.d.ts} +1 -1
package/dist/index.d.ts +7 -8
package/dist/index.js +9 -8
package/dist/index.js.map +1 -1
package/dist/{kb-gate-C4tho31v.d.ts → kb-gate-DTBum3vH.d.ts} +9 -1
package/dist/{loop-runner-bin-C1MuoT8c.d.ts → loop-runner-bin-CVoCBmYk.d.ts} +3 -3
package/dist/loop-runner-bin.d.ts +4 -5
package/dist/loop-runner-bin.js +3 -3
package/dist/loops.d.ts +65 -7
package/dist/loops.js +7 -1
package/dist/mcp/bin.js +28 -17
package/dist/mcp/bin.js.map +1 -1
package/dist/mcp/index.d.ts +6 -6
package/dist/mcp/index.js +17 -49
package/dist/mcp/index.js.map +1 -1
package/dist/{otel-export-xgf4J6bo.d.ts → otel-export-BzvF1Ela.d.ts} +1 -1
package/dist/profiles.d.ts +1 -2
package/dist/{types-CNs7_1R3.d.ts → types-Bcp071Jg.d.ts} +488 -3
package/package.json +11 -22
package/dist/chunk-6HI3QUJD.js.map +0 -1
package/dist/chunk-7ZECSZ3C.js +0 -400
package/dist/chunk-7ZECSZ3C.js.map +0 -1
package/dist/chunk-HSX6PFZR.js.map +0 -1
package/dist/chunk-OISRXLWI.js.map +0 -1
package/dist/chunk-VFKBIZTY.js.map +0 -1
package/dist/types-CsCCryln.d.ts +0 -489
/package/dist/{chunk-3WQJRSUJ.js.map → chunk-BDGYYO7K.js.map} +0 -0

package/dist/types-CsCCryln.d.ts DELETED Viewed

@@ -1,489 +0,0 @@
-import { ControlEvalResult, KnowledgeRequirement, ControlBudget, KnowledgeReadinessReport, ControlStep, ControlDecision, UserQuestion, DataAcquisitionPlan, ControlRunResult, RunRecord, TraceStore } from '@tangle-network/agent-eval';
-/**
- * @stable
- *
- * Core task, session, adapter, and stream-event types for the runtime.
- *
- * This module owns the public shape of every cross-cutting record (`AgentTaskSpec`,
- * `RuntimeSession`, `RuntimeStreamEvent`). Everything else in the runtime
- * imports from here so type-level changes ripple in one place.
- */
-/**
- * @stable
- *
- * Task description record. It is referenced as the `task` field (or `task`
- * parameter) by nearly every other type in this module.
- *
- * Only `id` and `intent` are required; every other field is optional.
- *  - `inputs` / `metadata` — free-form records with `unknown` values.
- *  - `requiredKnowledge` — `KnowledgeRequirement` entries (type imported from
- *    `@tangle-network/agent-eval`).
- *  - `budget` — a `Partial<ControlBudget>`, so any subset of the budget
- *    fields may be supplied.
- */
-interface AgentTaskSpec {
-    id: string;
-    intent: string;
-    /** Domain is metadata, not an architectural boundary: tax, legal, gtm, creative, blueprint, redteam, etc. */
-    domain?: string;
-    inputs?: Record<string, unknown>;
-    requiredKnowledge?: KnowledgeRequirement[];
-    budget?: Partial<ControlBudget>;
-    metadata?: Record<string, unknown>;
-}
-/**
- * @stable
- *
- * Caller-supplied hooks around knowledge readiness. Every method is optional,
- * and each may return its result either directly or wrapped in a `Promise`.
- *
- *  - `buildReadiness` — produces a `KnowledgeReadinessReport` for a task.
- *  - `answerQuestions` — receives `UserQuestion[]` and returns a
- *    string-to-string record. NOTE(review): presumably keyed by question id;
- *    the key semantics are not visible here — confirm against the caller.
- *  - `executeAcquisitionPlans` — receives `DataAcquisitionPlan[]` and returns
- *    `string[]`. NOTE(review): presumably evidence ids (compare
- *    `acquiredEvidenceIds` below) — confirm.
- *  - `refreshReadiness` — receives the previous report together with
- *    `userAnswers` and `acquiredEvidenceIds`, and returns a new report.
- */
-interface AgentKnowledgeProvider {
-    buildReadiness?(task: AgentTaskSpec): Promise<KnowledgeReadinessReport> | KnowledgeReadinessReport;
-    answerQuestions?(questions: UserQuestion[], task: AgentTaskSpec): Promise<Record<string, string>> | Record<string, string>;
-    executeAcquisitionPlans?(plans: DataAcquisitionPlan[], task: AgentTaskSpec): Promise<string[]> | string[];
-    refreshReadiness?(input: {
-        task: AgentTaskSpec;
-        previous: KnowledgeReadinessReport;
-        userAnswers: Record<string, string>;
-        acquiredEvidenceIds: string[];
-    }): Promise<KnowledgeReadinessReport> | KnowledgeReadinessReport;
-}
-/**
- * @stable
- *
- * Context object passed to the `decide`, `act` (second argument) and
- * `shouldStop` hooks of `AgentAdapter`.
- *
- * Type parameters: `TState`, `TAction` and `TActionResult` are unconstrained;
- * `TEval` must extend `ControlEvalResult` and defaults to it.
- *
- * Every field is required except `remainingCostUsd`. `history` is a list of
- * `ControlStep` records parameterised by the same four type arguments.
- * NOTE(review): `wallMs` and `spentCostUsd` look like elapsed wall-clock
- * milliseconds and accumulated spend in USD — inferred from the names only,
- * confirm against the control loop.
- */
-interface AgentTaskContext<TState, TAction, TActionResult, TEval extends ControlEvalResult = ControlEvalResult> {
-    task: AgentTaskSpec;
-    knowledge: KnowledgeReadinessReport;
-    state: TState;
-    evals: TEval[];
-    history: ControlStep<TState, TAction, TActionResult, TEval>[];
-    budget: ControlBudget;
-    stepIndex: number;
-    wallMs: number;
-    spentCostUsd: number;
-    remainingCostUsd?: number;
-    abortSignal: AbortSignal;
-}
-/**
- * @stable
- *
- * Adapter contract supplied as `RunAgentTaskOptions.adapter`.
- *
- * Required hooks (each may return its value directly or as a `Promise`):
- *  - `observe` — returns the current `TState`.
- *  - `validate` — returns `TEval[]` for a given state.
- *  - `decide` — returns a `ControlDecision<TAction>` from an `AgentTaskContext`.
- *  - `act` — receives the chosen `TAction` plus the context and returns a
- *    `TActionResult`.
- *
- * Optional hooks:
- *  - `shouldStop` — returns `{ stop, pass, reason, score? }`, sync or async.
- *  - `onKnowledgeBlocked` — receives the readiness report together with the
- *    outstanding questions and acquisition plans and returns a
- *    `ControlDecision<TAction>`, sync or async.
- *  - `getActionCostUsd` — synchronous only; returns `number | undefined`.
- *  - `projectRunRecords` — synchronous only; maps a `ControlRunResult` and the
- *    task to `RunRecord[]`.
- *
- * `TEval` must extend `ControlEvalResult` and defaults to it.
- */
-interface AgentAdapter<TState, TAction, TActionResult, TEval extends ControlEvalResult = ControlEvalResult> {
-    observe(ctx: {
-        task: AgentTaskSpec;
-        knowledge: KnowledgeReadinessReport;
-        history: ControlStep<TState, TAction, TActionResult, TEval>[];
-        abortSignal: AbortSignal;
-    }): Promise<TState> | TState;
-    validate(ctx: {
-        task: AgentTaskSpec;
-        knowledge: KnowledgeReadinessReport;
-        state: TState;
-        history: ControlStep<TState, TAction, TActionResult, TEval>[];
-        abortSignal: AbortSignal;
-    }): Promise<TEval[]> | TEval[];
-    decide(ctx: AgentTaskContext<TState, TAction, TActionResult, TEval>): Promise<ControlDecision<TAction>> | ControlDecision<TAction>;
-    act(action: TAction, ctx: AgentTaskContext<TState, TAction, TActionResult, TEval>): Promise<TActionResult> | TActionResult;
-    shouldStop?(ctx: AgentTaskContext<TState, TAction, TActionResult, TEval>): Promise<{
-        stop: boolean;
-        pass: boolean;
-        reason: string;
-        score?: number;
-    }> | {
-        stop: boolean;
-        pass: boolean;
-        reason: string;
-        score?: number;
-    };
-    onKnowledgeBlocked?(ctx: {
-        task: AgentTaskSpec;
-        knowledge: KnowledgeReadinessReport;
-        questions: UserQuestion[];
-        acquisitionPlans: DataAcquisitionPlan[];
-    }): Promise<ControlDecision<TAction>> | ControlDecision<TAction>;
-    getActionCostUsd?(ctx: {
-        action: TAction;
-        result: TActionResult;
-        task: AgentTaskSpec;
-        state: TState;
-        evals: TEval[];
-        history: ControlStep<TState, TAction, TActionResult, TEval>[];
-    }): number | undefined;
-    projectRunRecords?(result: ControlRunResult<TState, TAction, TActionResult, TEval>, task: AgentTaskSpec): RunRecord[];
-}
-/**
- * @stable
- *
- * Outcome label for a task. Carried by the `task_end` and `final` event
- * variants and by `AgentTaskRunResult.status`.
- */
-type AgentTaskStatus = 'completed' | 'blocked' | 'failed' | 'aborted';
-/**
- * @stable
- *
- * Discriminated union (tag: `type`) of events delivered to an
- * `AgentRuntimeEventSink`. Every variant carries the `task`; narrow on `type`
- * to reach the variant-specific payload.
- *
- * Variants: `task_start`, `readiness_start` / `readiness_end`,
- * `questions_start` / `questions_end`, `acquisition_start` /
- * `acquisition_end`, `control_start` / `control_step` / `control_end`, and
- * `task_end`.
- *
- * Unlike `RuntimeStreamEvent`, no variant here has a `timestamp` field.
- * All four type parameters default (`unknown` for the first three,
- * `ControlEvalResult` for `TEval`).
- */
-type AgentRuntimeEvent<TState = unknown, TAction = unknown, TActionResult = unknown, TEval extends ControlEvalResult = ControlEvalResult> = {
-    type: 'task_start';
-    task: AgentTaskSpec;
-} | {
-    type: 'readiness_start';
-    task: AgentTaskSpec;
-} | {
-    type: 'readiness_end';
-    task: AgentTaskSpec;
-    knowledge: KnowledgeReadinessReport;
-} | {
-    type: 'questions_start';
-    task: AgentTaskSpec;
-    questions: UserQuestion[];
-} | {
-    type: 'questions_end';
-    task: AgentTaskSpec;
-    questions: UserQuestion[];
-    userAnswers: Record<string, string>;
-} | {
-    type: 'acquisition_start';
-    task: AgentTaskSpec;
-    acquisitionPlans: DataAcquisitionPlan[];
-} | {
-    type: 'acquisition_end';
-    task: AgentTaskSpec;
-    acquisitionPlans: DataAcquisitionPlan[];
-    acquiredEvidenceIds: string[];
-} | {
-    type: 'control_start';
-    task: AgentTaskSpec;
-    knowledge: KnowledgeReadinessReport;
-} | {
-    type: 'control_step';
-    task: AgentTaskSpec;
-    step: ControlStep<TState, TAction, TActionResult, TEval>;
-} | {
-    type: 'control_end';
-    task: AgentTaskSpec;
-    control: ControlRunResult<TState, TAction, TActionResult, TEval>;
-} | {
-    type: 'task_end';
-    task: AgentTaskSpec;
-    status: AgentTaskStatus;
-    reason: string;
-};
-/**
- * @stable
- *
- * Callback that receives one `AgentRuntimeEvent` at a time. It may return
- * `void` or a `Promise<void>`. This is the type of
- * `RunAgentTaskOptions.onEvent`.
- */
-type AgentRuntimeEventSink<TState = unknown, TAction = unknown, TActionResult = unknown, TEval extends ControlEvalResult = ControlEvalResult> = (event: AgentRuntimeEvent<TState, TAction, TActionResult, TEval>) => Promise<void> | void;
-/**
- * @stable
- *
- * Typed transport / backend failure detail. Carried on `backend_error` and
- * `final` events when the backend's stream throws or the upstream HTTP call
- * returns a non-success status. Lets consumers (a) distinguish "stream
- * completed with no text" from "stream never reached the model" and
- * (b) reconstruct the precise upstream signal (status + truncated body) when
- * building a `RunRecord.error`.
- *
- * `body` is truncated to 2 KiB by the backend so an HTML error page from a
- * misconfigured proxy never bloats event payloads or logs. Consumers needing
- * the full body should inspect the underlying `BackendTransportError.body`
- * via a custom `mapEvent` or backend wrapper.
- *
- * Only `kind` and `message` are always present; `status` and `body` are
- * optional.
- */
-interface BackendErrorDetail {
-    /**
-     * `'transport'` — upstream HTTP / network failure with optional status code.
-     * `'backend'` — the backend's `stream()` generator threw for a non-transport
-     * reason (e.g. a custom adapter error, sandbox crash).
-     */
-    kind: 'transport' | 'backend';
-    message: string;
-    /** Upstream HTTP status when known. `0` for connection / abort errors. */
-    status?: number;
-    /** Truncated response body (≤2 KiB). Diagnostic only — never machine-parsed. */
-    body?: string;
-}
-/**
- * @stable
- *
- * OpenAI Chat Completions tool descriptor. The shape mirrors the
- * `/v1/chat/completions` `tools[]` parameter so callers can pass tool
- * definitions through `createOpenAICompatibleBackend({ tools })` without any
- * runtime translation. The router proxies this shape verbatim to Anthropic
- * (translated server-side), DeepSeek, Groq, OpenAI, and Gemini — every model
- * that the eval surface targets.
- *
- * Callers that build their tool list from MCP servers should run a one-shot
- * MCP `tools/list` at config time and project the result into this shape. The
- * runtime intentionally does NOT depend on `@modelcontextprotocol/sdk` —
- * keeping the backend transport thin lets domain repos own MCP plumbing.
- *
- * Only `type` (always the literal `'function'`) and `function.name` are
- * required; `function.description` and `function.parameters` are optional.
- */
-interface OpenAIChatTool {
-    type: 'function';
-    function: {
-        name: string;
-        description?: string;
-        parameters?: Record<string, unknown>;
-    };
-}
-/**
- * @stable
- *
- * `tool_choice` parameter for OpenAI-compat chat. Same shape as the OpenAI
- * spec: `'auto'` (default — model decides), `'none'` (disable tool calling
- * for this turn), `'required'` (force a tool call), or a specific function
- * pin `{ type: 'function', function: { name } }`.
- *
- * The pinned form carries only the function `name`; it has no `description`
- * or `parameters` fields.
- */
-type OpenAIChatToolChoice = 'auto' | 'none' | 'required' | {
-    type: 'function';
-    function: {
-        name: string;
-    };
-};
-/**
- * @stable
- *
- * Discriminated union (tag: `type`) of events yielded by
- * `AgentExecutionBackend.stream` and accepted / returned by the optional
- * `RuntimeSessionStore.appendEvent` / `listEvents` hooks.
- *
- * The variants fall into two groups by which fields are mandatory:
- *  - Lifecycle variants — `task_start`, `readiness_start`, `readiness_end`,
- *    `questions_start`, `questions_end`, `acquisition_start`,
- *    `acquisition_end`, `session_created`, `session_resumed`,
- *    `backend_start`, `backend_error`, `backend_end`, `task_end`, `final` —
- *    always carry `task` and `timestamp`. `session` is required on the
- *    `session_*`, `backend_start` and `backend_end` variants and optional on
- *    `backend_error` and `final`.
- *  - Content variants — `text_delta`, `reasoning_delta`, `tool_call`,
- *    `tool_result`, `llm_call`, `artifact`, `proposal_created` — make `task`,
- *    `session` and `timestamp` all optional.
- *
- * `readiness_end` additionally carries a `KnowledgeReadinessDecision`.
- * `backend_error` and `final` may carry a typed `BackendErrorDetail` in
- * `error`.
- *
- * NOTE(review): `timestamp` is typed as `string`; the exact format (e.g.
- * ISO 8601) is not visible here — confirm against the emitter.
- */
-type RuntimeStreamEvent = {
-    type: 'task_start';
-    task: AgentTaskSpec;
-    timestamp: string;
-} | {
-    type: 'readiness_start';
-    task: AgentTaskSpec;
-    timestamp: string;
-} | {
-    type: 'readiness_end';
-    task: AgentTaskSpec;
-    knowledge: KnowledgeReadinessReport;
-    decision: KnowledgeReadinessDecision;
-    timestamp: string;
-} | {
-    type: 'questions_start';
-    task: AgentTaskSpec;
-    questions: UserQuestion[];
-    timestamp: string;
-} | {
-    type: 'questions_end';
-    task: AgentTaskSpec;
-    questions: UserQuestion[];
-    userAnswers: Record<string, string>;
-    timestamp: string;
-} | {
-    type: 'acquisition_start';
-    task: AgentTaskSpec;
-    acquisitionPlans: DataAcquisitionPlan[];
-    timestamp: string;
-} | {
-    type: 'acquisition_end';
-    task: AgentTaskSpec;
-    acquisitionPlans: DataAcquisitionPlan[];
-    acquiredEvidenceIds: string[];
-    timestamp: string;
-} | {
-    type: 'session_created';
-    task: AgentTaskSpec;
-    session: RuntimeSession;
-    timestamp: string;
-} | {
-    type: 'session_resumed';
-    task: AgentTaskSpec;
-    session: RuntimeSession;
-    timestamp: string;
-} | {
-    type: 'backend_start';
-    task: AgentTaskSpec;
-    session: RuntimeSession;
-    backend: string;
-    timestamp: string;
-} | {
-    type: 'text_delta';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    text: string;
-    timestamp?: string;
-} | {
-    type: 'reasoning_delta';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    text: string;
-    timestamp?: string;
-} | {
-    type: 'tool_call';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    toolName: string;
-    toolCallId?: string;
-    args?: unknown;
-    timestamp?: string;
-} | {
-    type: 'tool_result';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    toolName: string;
-    toolCallId?: string;
-    result?: unknown;
-    timestamp?: string;
-} | {
-    type: 'llm_call';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    model: string;
-    tokensIn?: number;
-    tokensOut?: number;
-    costUsd?: number;
-    latencyMs?: number;
-    finishReason?: string;
-    timestamp?: string;
-} | {
-    type: 'artifact';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    artifactId: string;
-    name?: string;
-    mimeType?: string;
-    uri?: string;
-    content?: string;
-    metadata?: Record<string, unknown>;
-    timestamp?: string;
-} | {
-    type: 'proposal_created';
-    task?: AgentTaskSpec;
-    session?: RuntimeSession;
-    proposalId: string;
-    title: string;
-    status?: 'pending' | 'approved' | 'rejected';
-    timestamp?: string;
-} | {
-    type: 'backend_error';
-    task: AgentTaskSpec;
-    session?: RuntimeSession;
-    backend: string;
-    message: string;
-    recoverable: boolean;
-    /**
-     * Typed transport diagnostic. Present when the upstream returned a
-     * non-success HTTP status or every retry attempt threw. Consumers MUST
-     * surface this onto their `RunRecord.error` — silently treating a
-     * `backend_error` as "no output" hides credit exhaustion, auth failure,
-     * and upstream outages from operators.
-     *  - `kind: 'transport'` — HTTP / network failure with optional `status`
-     *    + truncated response `body`.
-     *  - `kind: 'backend'` — the backend's `stream()` generator threw for a
-     *    reason that isn't a recognized transport failure.
-     */
-    error?: BackendErrorDetail;
-    timestamp: string;
-} | {
-    type: 'backend_end';
-    task: AgentTaskSpec;
-    session: RuntimeSession;
-    backend: string;
-    timestamp: string;
-} | {
-    type: 'task_end';
-    task: AgentTaskSpec;
-    status: AgentTaskStatus;
-    reason: string;
-    timestamp: string;
-} | {
-    type: 'final';
-    task: AgentTaskSpec;
-    session?: RuntimeSession;
-    status: AgentTaskStatus;
-    reason: string;
-    text?: string;
-    metadata?: Record<string, unknown>;
-    /**
-     * Typed terminal-error diagnostic. Mirrors the `backend_error.error`
-     * shape so a consumer that only listens for `final` still receives a
-     * loud, structured failure when the backend never produced output. Only
-     * set when `status !== 'completed'`. Consumers building a `RunRecord`
-     * MUST map this to `RunRecord.error` rather than recording silent
-     * `error: null` with empty `finalText`.
-     */
-    error?: BackendErrorDetail;
-    timestamp: string;
-};
-/**
- * @stable
- *
- * Session record exchanged between backends (`AgentExecutionBackend.start` /
- * `resume` / `stop`) and a `RuntimeSessionStore`, and attached to many
- * `RuntimeStreamEvent` variants.
- *
- * `id`, `backend`, `status`, `createdAt` and `updatedAt` are required;
- * `resumeToken` and `metadata` are optional.
- * NOTE(review): `createdAt` / `updatedAt` are plain strings; the format is
- * not visible here — presumably a timestamp string, confirm.
- */
-interface RuntimeSession {
-    id: string;
-    backend: string;
-    status: 'active' | 'completed' | 'failed' | 'aborted';
-    resumeToken?: string;
-    createdAt: string;
-    updatedAt: string;
-    metadata?: Record<string, unknown>;
-}
-/**
- * @stable
- *
- * Persistence contract for `RuntimeSession` records. `get` and `put` are
- * required; `appendEvent` and `listEvents` are optional. Every method may
- * return its value directly or as a `Promise`.
- *
- * `get` may resolve to `undefined`. NOTE(review): presumably meaning "no
- * session with that id" — confirm against the implementations.
- */
-interface RuntimeSessionStore {
-    get(sessionId: string): Promise<RuntimeSession | undefined> | RuntimeSession | undefined;
-    put(session: RuntimeSession): Promise<void> | void;
-    appendEvent?(sessionId: string, event: RuntimeStreamEvent): Promise<void> | void;
-    listEvents?(sessionId: string): Promise<RuntimeStreamEvent[]> | RuntimeStreamEvent[];
-}
-/**
- * @stable
- *
- * Base input shape for an execution backend. It is the constraint and default
- * for the `TInput` type parameter of `AgentExecutionBackend` and
- * `RunAgentTaskStreamOptions`.
- *
- * Only `task` is required. `message` is a single string, `messages` is a
- * list of `{ role, content }` pairs (both plain strings), and `inputs` is a
- * free-form record.
- */
-interface AgentBackendInput {
-    task: AgentTaskSpec;
-    message?: string;
-    messages?: Array<{
-        role: string;
-        content: string;
-    }>;
-    inputs?: Record<string, unknown>;
-}
-/**
- * @stable
- *
- * Per-call context handed to `AgentExecutionBackend.stream`. The `start` and
- * `resume` hooks receive the same shape with `session` omitted.
- *
- * `task`, `knowledge` and `session` are required; `signal`, `runId`,
- * `turnId`, `parentTurnId` and `propagatedHeaders` are optional.
- */
-interface AgentBackendContext {
-    task: AgentTaskSpec;
-    knowledge: KnowledgeReadinessReport;
-    session: RuntimeSession;
-    signal?: AbortSignal;
-    /**
-     * Conversation/run identifier when this call is part of a multi-agent run.
-     * Backends should stamp it into any trace/log emission so cross-participant
-     * events correlate. Absent when the call is a stand-alone `runAgentTask`.
-     */
-    runId?: string;
-    /**
-     * Deterministic turn id for this single call. Stable across retries of the
-     * same logical turn so a caching gateway / idempotent backend can dedupe.
-     */
-    turnId?: string;
-    /**
-     * If this call is itself nested inside a higher-order conversation
-     * (recursion via `createConversationBackend`), the enclosing turn's id.
-     * Used for trace stitching across nested orchestration.
-     */
-    parentTurnId?: string;
-    /**
-     * Headers to forward verbatim to any outbound HTTP the backend issues:
-     * `X-Tangle-Forwarded-Authorization`, `X-Tangle-Forwarded-Depth`,
-     * run/turn correlation. Backends that issue HTTP MUST merge these into
-     * the outbound request; backends that don't issue HTTP may ignore them.
-     */
-    propagatedHeaders?: Readonly<Record<string, string>>;
-}
-/**
- * @stable
- *
- * Contract for an execution backend, supplied as
- * `RunAgentTaskStreamOptions.backend`.
- *
- *  - `kind` — string label for the backend.
- *  - `stream` — the only required method; returns an
- *    `AsyncIterable<RuntimeStreamEvent>` for the given input and context.
- *  - `start` (optional) — returns a `RuntimeSession`, sync or async. Its
- *    context is `AgentBackendContext` without `session`, plus an optional
- *    `requestedSessionId`.
- *  - `resume` (optional) — takes an existing session and returns a
- *    `RuntimeSession`, sync or async.
- *  - `stop` (optional) — takes a session and a `reason` string.
- */
-interface AgentExecutionBackend<TInput extends AgentBackendInput = AgentBackendInput> {
-    kind: string;
-    start?(input: TInput, context: Omit<AgentBackendContext, 'session'> & {
-        requestedSessionId?: string;
-    }): Promise<RuntimeSession> | RuntimeSession;
-    resume?(session: RuntimeSession, input: TInput, context: Omit<AgentBackendContext, 'session'>): Promise<RuntimeSession> | RuntimeSession;
-    stream(input: TInput, context: AgentBackendContext): AsyncIterable<RuntimeStreamEvent>;
-    stop?(session: RuntimeSession, reason: string): Promise<void> | void;
-}
-/**
- * @stable
- *
- * Options bag for a backend-driven (streaming) task run. `task` and `backend`
- * are required; everything else is optional.
- *
- * `input` is the backend's `TInput` with the `task` key omitted, since the
- * task is already supplied at the top level of this object.
- * NOTE(review): the interplay of `sessionId`, `resume` and `sessionStore`,
- * and the scale of `minimumReadinessScore`, are not visible in this
- * declaration — confirm against the function that consumes these options.
- */
-interface RunAgentTaskStreamOptions<TInput extends AgentBackendInput = AgentBackendInput> {
-    task: AgentTaskSpec;
-    backend: AgentExecutionBackend<TInput>;
-    input?: Omit<TInput, 'task'>;
-    knowledge?: AgentKnowledgeProvider;
-    sessionStore?: RuntimeSessionStore;
-    sessionId?: string;
-    resume?: boolean;
-    signal?: AbortSignal;
-    minimumReadinessScore?: number;
-}
-/**
- * @stable
- *
- * Options bag for an adapter-driven task run. `task` and `adapter` are
- * required; everything else is optional.
- *
- *  - `knowledge` — optional `AgentKnowledgeProvider` hooks.
- *  - `onEvent` — optional `AgentRuntimeEventSink` typed with the same four
- *    type arguments as the adapter.
- *  - `store` — optional `TraceStore` (type imported from
- *    `@tangle-network/agent-eval`).
- *  - `scenarioId` / `projectId` / `variantId` — optional string identifiers.
- *    NOTE(review): how they are used is not visible here — confirm.
- */
-interface RunAgentTaskOptions<TState, TAction, TActionResult, TEval extends ControlEvalResult = ControlEvalResult> {
-    task: AgentTaskSpec;
-    adapter: AgentAdapter<TState, TAction, TActionResult, TEval>;
-    knowledge?: AgentKnowledgeProvider;
-    onEvent?: AgentRuntimeEventSink<TState, TAction, TActionResult, TEval>;
-    store?: TraceStore;
-    signal?: AbortSignal;
-    scenarioId?: string;
-    projectId?: string;
-    variantId?: string;
-    minimumReadinessScore?: number;
-}
-/**
- * @stable
- *
- * Result record for an adapter-driven task run. Every field is required:
- * the original `task`, the outcome `status`, the readiness report, the
- * questions and acquisition plans together with the collected `userAnswers`
- * and `acquiredEvidenceIds`, the `ControlRunResult`, and the list of
- * `RunRecord`s.
- */
-interface AgentTaskRunResult<TState, TAction, TActionResult, TEval extends ControlEvalResult = ControlEvalResult> {
-    task: AgentTaskSpec;
-    status: AgentTaskStatus;
-    knowledge: KnowledgeReadinessReport;
-    questions: UserQuestion[];
-    acquisitionPlans: DataAcquisitionPlan[];
-    userAnswers: Record<string, string>;
-    acquiredEvidenceIds: string[];
-    control: ControlRunResult<TState, TAction, TActionResult, TEval>;
-    runRecords: RunRecord[];
-}
-/**
- * @stable
- *
- * Readiness verdict carried on the `readiness_end` variant of
- * `RuntimeStreamEvent`. Every field is required.
- *
- * `recommendedAction` and `severity` reuse the types of the same-named
- * properties on `KnowledgeReadinessReport` via indexed access, so they stay
- * in sync with that type. Gap ids are split into `blockingGapIds` and
- * `nonBlockingGapIds`.
- * NOTE(review): the relation between `passed` and `status`, and the scale of
- * `readinessScore`, are not visible here — confirm against the code that
- * builds the decision.
- */
-interface KnowledgeReadinessDecision {
-    passed: boolean;
-    status: 'ready' | 'blocked' | 'caveat';
-    reason: string;
-    readinessScore: number;
-    recommendedAction: KnowledgeReadinessReport['recommendedAction'];
-    severity: KnowledgeReadinessReport['severity'];
-    blockingGapIds: string[];
-    nonBlockingGapIds: string[];
-}
-export type { AgentTaskSpec as A, BackendErrorDetail as B, KnowledgeReadinessDecision as K, OpenAIChatTool as O, RuntimeStreamEvent as R, AgentBackendInput as a, AgentExecutionBackend as b, OpenAIChatToolChoice as c, AgentBackendContext as d, RunAgentTaskOptions as e, AgentTaskRunResult as f, RunAgentTaskStreamOptions as g, AgentRuntimeEvent as h, AgentTaskStatus as i, RuntimeSessionStore as j, RuntimeSession as k, AgentAdapter as l, AgentKnowledgeProvider as m, AgentRuntimeEventSink as n, AgentTaskContext as o };

/package/dist/{chunk-3WQJRSUJ.js.map → chunk-BDGYYO7K.js.map} RENAMED Viewed

File without changes