npm - @codemation/core - Versions diffs - 0.8.1 → 0.10.1 - Mend

@codemation/core 0.8.1 → 0.10.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (100)

package/CHANGELOG.md +386 -0
package/dist/{EngineRuntimeRegistration.types-BP6tsaNP.d.ts → EngineRuntimeRegistration.types-D1fyApMI.d.ts} +2 -2
package/dist/{EngineWorkflowRunnerService-DzOCa1BW.d.cts → EngineRuntimeRegistration.types-pB3FnzqR.d.cts} +17 -17
package/dist/{InMemoryRunDataFactory-1iz7_SnO.d.cts → InMemoryRunDataFactory-Xw7v4-sj.d.cts} +31 -29
package/dist/InMemoryRunEventBusRegistry-VM3OWnHo.cjs +47 -0
package/dist/InMemoryRunEventBusRegistry-VM3OWnHo.cjs.map +1 -0
package/dist/InMemoryRunEventBusRegistry-sM4z4n_i.js +41 -0
package/dist/InMemoryRunEventBusRegistry-sM4z4n_i.js.map +1 -0
package/dist/{RunIntentService-BqhmdoA1.d.ts → RunIntentService-BE9CAkbf.d.ts} +966 -471
package/dist/{RunIntentService-S-1lW-gS.d.cts → RunIntentService-siBSjaaY.d.cts} +859 -493
package/dist/bootstrap/index.cjs +5 -2
package/dist/bootstrap/index.d.cts +212 -135
package/dist/bootstrap/index.d.ts +4 -4
package/dist/bootstrap/index.js +3 -3
package/dist/{bootstrap-Bx1u4cbS.cjs → bootstrap-Cm5ruQxx.cjs} +253 -2
package/dist/bootstrap-Cm5ruQxx.cjs.map +1 -0
package/dist/{bootstrap-BoknFKnw.js → bootstrap-D3r505ko.js} +236 -3
package/dist/bootstrap-D3r505ko.js.map +1 -0
package/dist/{index-CVs9rVhl.d.ts → index-DeLl1Tne.d.ts} +632 -230
package/dist/index.cjs +323 -176
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +544 -91
package/dist/index.d.ts +3 -3
package/dist/index.js +299 -166
package/dist/index.js.map +1 -1
package/dist/{runtime-DUW6tIJ1.js → runtime-BGNbRnqs.js} +934 -75
package/dist/runtime-BGNbRnqs.js.map +1 -0
package/dist/{runtime-Dvo2ru5A.cjs → runtime-DKXJwTNv.cjs} +1028 -73
package/dist/runtime-DKXJwTNv.cjs.map +1 -0
package/dist/testing.cjs +4 -4
package/dist/testing.cjs.map +1 -1
package/dist/testing.d.cts +2 -2
package/dist/testing.d.ts +2 -2
package/dist/testing.js +3 -3
package/package.json +7 -2
package/src/ai/AiHost.ts +42 -14
package/src/authoring/DefinedCollectionRegistry.ts +17 -0
package/src/authoring/defineCollection.types.ts +181 -0
package/src/authoring/definePollingTrigger.types.ts +396 -0
package/src/authoring/definePollingTriggerInternals.ts +74 -0
package/src/authoring/index.ts +19 -0
package/src/bootstrap/index.ts +9 -0
package/src/bootstrap/runtime/EngineRuntimeRegistrar.ts +8 -0
package/src/browser.ts +1 -0
package/src/contracts/CodemationTelemetryAttributeNames.ts +6 -0
package/src/contracts/NoOpNodeExecutionTelemetry.ts +2 -11
package/src/contracts/NoOpTelemetrySpanScope.ts +46 -10
package/src/contracts/assertionTypes.ts +63 -0
package/src/contracts/baseTypes.ts +12 -0
package/src/contracts/collectionTypes.ts +44 -0
package/src/contracts/credentialTypes.ts +23 -1
package/src/contracts/executionPersistenceContracts.ts +30 -0
package/src/contracts/index.ts +4 -0
package/src/contracts/runTypes.ts +37 -1
package/src/contracts/runtimeTypes.ts +42 -0
package/src/contracts/telemetryTypes.ts +8 -0
package/src/contracts/testTriggerTypes.ts +66 -0
package/src/contracts/workflowTypes.ts +36 -7
package/src/contracts.ts +59 -0
package/src/events/ConnectionInvocationEventPublisher.ts +46 -0
package/src/events/index.ts +1 -0
package/src/events/runEvents.ts +74 -0
package/src/execution/ChildExecutionScopeFactory.ts +55 -0
package/src/execution/DefaultExecutionContextFactory.ts +6 -0
package/src/execution/ExecutionTelemetryCostTrackingDecoratorFactory.ts +18 -0
package/src/execution/NodeExecutor.ts +10 -2
package/src/execution/NodeInstanceFactory.ts +13 -1
package/src/execution/NodeInstantiationError.ts +16 -0
package/src/execution/NodeRunStateWriter.ts +7 -0
package/src/execution/NodeRunStateWriterFactory.ts +7 -0
package/src/execution/WorkflowRunExecutionContextFactory.ts +3 -0
package/src/execution/index.ts +2 -0
package/src/index.ts +8 -0
package/src/orchestration/AbortControllerFactory.ts +9 -0
package/src/orchestration/NodeExecutionRequestHandlerService.ts +1 -0
package/src/orchestration/RunContinuationService.ts +3 -0
package/src/orchestration/RunStartService.ts +122 -3
package/src/orchestration/TestSuiteOrchestrator.ts +350 -0
package/src/orchestration/TestSuiteRunIdFactory.ts +11 -0
package/src/orchestration/TriggerRuntimeService.ts +34 -7
package/src/orchestration/index.ts +9 -0
package/src/runtime/EngineFactory.ts +12 -0
package/src/triggers/polling/PollingTriggerDedupWindow.ts +23 -0
package/src/triggers/polling/PollingTriggerLogger.ts +18 -0
package/src/triggers/polling/PollingTriggerRuntime.ts +122 -0
package/src/triggers/polling/index.ts +5 -0
package/src/types/index.ts +12 -9
package/src/workflow/definition/NodeIterationIdFactory.ts +26 -0
package/src/workflow/dsl/NodeIdSlugifier.ts +18 -0
package/src/workflow/dsl/WorkflowBuilder.ts +71 -3
package/src/workflow/dsl/WorkflowDefinitionError.ts +15 -0
package/src/workflow/index.ts +3 -0
package/dist/InMemoryRunEventBusRegistry-B0_C4OnP.cjs +0 -262
package/dist/InMemoryRunEventBusRegistry-B0_C4OnP.cjs.map +0 -1
package/dist/InMemoryRunEventBusRegistry-C2U83Hmv.js +0 -238
package/dist/InMemoryRunEventBusRegistry-C2U83Hmv.js.map +0 -1
package/dist/bootstrap-BoknFKnw.js.map +0 -1
package/dist/bootstrap-Bx1u4cbS.cjs.map +0 -1
package/dist/runtime-DUW6tIJ1.js.map +0 -1
package/dist/runtime-Dvo2ru5A.cjs.map +0 -1

package/src/contracts/assertionTypes.ts ADDED Viewed

@@ -0,0 +1,63 @@
+import type { JsonValue, NodeId } from "./workflowTypes";
+/**
+ * One assertion emitted by an assertion-emitting node (a node whose config sets
+ * `emitsAssertions: true`). Each emitted item on `main` carries one of these as `item.json`.
+ *
+ * Pass/fail is derived from `score >= (passThreshold ?? 0.5)` — see {@link deriveAssertionPassed}.
+ * The `errored` marker is for cases where the assertion code itself threw (distinct from
+ * "the assertion was evaluated and the score was low") and is treated as a hard fail in rollups
+ * regardless of `score`.
+ */
+export interface AssertionResult {
+  readonly name: string;
+  /** 0..1 score. Source of truth for pass/fail (compared against `passThreshold`). */
+  readonly score: number;
+  /** 0..1 threshold for "passed". When omitted, consumers default to 0.5. */
+  readonly passThreshold?: number;
+  /** True when evaluating the assertion threw — treated as fail regardless of `score`. */
+  readonly errored?: true;
+  /** What the assertion expected. Free-form JSON; UIs render with a JSON viewer. */
+  readonly expected?: JsonValue;
+  /** What the workflow actually produced. */
+  readonly actual?: JsonValue;
+  /** Short human-readable explanation, especially for fails / errors. */
+  readonly message?: string;
+  /** Bag of supplemental fields (e.g. judge prompt, judge raw response, comparison method). */
+  readonly details?: Readonly<Record<string, JsonValue>>;
+}
+/**
+ * Default {@link AssertionResult.passThreshold} when authors omit it. Boolean-style assertions
+ * (assertEqual / contains / etc.) emit `score: 1` or `score: 0` so this default works for them;
+ * AI-judge assertions are expected to set their own threshold.
+ */
+export const DEFAULT_ASSERTION_PASS_THRESHOLD = 0.5;
+/**
+ * Derive whether an assertion result is considered "passing" using the score-based contract:
+ * `errored` always fails, otherwise `score >= (passThreshold ?? 0.5)`. This is the canonical
+ * derivation — UI and rollup code should call it rather than inlining the comparison so future
+ * tweaks (e.g. NaN handling) land in one place.
+ */
+export function deriveAssertionPassed(result: {
+  readonly score: number;
+  readonly passThreshold?: number;
+  readonly errored?: true;
+}): boolean {
+  if (result.errored === true) return false;
+  const threshold = result.passThreshold ?? DEFAULT_ASSERTION_PASS_THRESHOLD;
+  return result.score >= threshold;
+}
+/**
+ * Provenance for a persisted {@link AssertionResult}: which node produced it and where in the
+ * per-item iteration tree it landed. Filled in by the host-side persister, not the node itself.
+ */
+export interface AssertionResultProvenance {
+  readonly nodeId: NodeId;
+  /** Per-item iteration id when the emitting node ran inside a per-item loop. */
+  readonly iterationId?: string;
+  /** Item index (0-based) within the activation that produced this assertion. */
+  readonly itemIndex?: number;
+}

package/src/contracts/baseTypes.ts ADDED Viewed

@@ -0,0 +1,12 @@
+/**
+ * Minimal base types that have no dependencies on other contracts.
+ * Used by credentialTypes, workflowTypes, and other contract layers
+ * to avoid circular dependencies.
+ */
+export type WorkflowId = string;
+export type NodeId = string;
+export type OutputPortKey = string;
+export type InputPortKey = string;
+export type PersistedTokenId = string;
+export type NodeConnectionName = string;

package/src/contracts/collectionTypes.ts ADDED Viewed

@@ -0,0 +1,44 @@
+/**
+ * Represents a typed store for a single collection.
+ * All rows include auto-managed id, created_at, and updated_at fields.
+ */
+export interface CollectionStore<TRow extends Record<string, unknown> = Record<string, unknown>> {
+  /**
+   * Insert a new row. id, created_at, and updated_at are auto-populated.
+   */
+  insert(row: TRow): Promise<TRow & { id: string; created_at: Date; updated_at: Date }>;
+  /**
+   * Get a single row by id.
+   */
+  get(id: string): Promise<(TRow & { id: string; created_at: Date; updated_at: Date }) | null>;
+  /**
+   * Find a single row matching the provided filter.
+   */
+  findOne(filter: Partial<TRow>): Promise<(TRow & { id: string; created_at: Date; updated_at: Date }) | null>;
+  /**
+   * List rows with optional pagination and filtering.
+   */
+  list(opts?: {
+    limit?: number;
+    offset?: number;
+    where?: Partial<TRow>;
+  }): Promise<{ rows: ReadonlyArray<TRow & { id: string; created_at: Date; updated_at: Date }>; total: number }>;
+  /**
+   * Update a row by id with partial data.
+   */
+  update(id: string, patch: Partial<TRow>): Promise<TRow & { id: string; created_at: Date; updated_at: Date }>;
+  /**
+   * Delete a row by id. Hard delete only (no soft delete).
+   */
+  delete(id: string): Promise<{ deleted: boolean }>;
+}
+/**
+ * Runtime collections context: keyed by collection name.
+ */
+export type CollectionsContext = Readonly<Record<string, CollectionStore>>;

package/src/contracts/credentialTypes.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import type { NodeId, WorkflowId } from "./workflowTypes";
+import type { NodeId, WorkflowId } from "./baseTypes";
 export type CredentialTypeId = string;
 export type CredentialInstanceId = string;
@@ -91,6 +91,28 @@ export type CredentialOAuth2AuthDefinition = Readonly<
       clientIdFieldKey?: string;
       clientSecretFieldKey?: string;
     }
+  | {
+      kind: "oauth2";
+      /**
+       * Free-form provider identifier for telemetry, DB rows, and Better Auth provider naming.
+       * Not used for any registry lookup — URLs come from {@link authorizeUrl} / {@link tokenUrl}.
+       */
+      providerId: string;
+      /**
+       * Authorization endpoint. May contain `{publicFieldKey}` placeholders that the runtime
+       * substitutes from the credential's resolved public config (URL-encoded).
+       * Example: `https://login.microsoftonline.com/{tenantId}/oauth2/v2.0/authorize`
+       */
+      authorizeUrl: string;
+      /** Token endpoint. Same templating rules as {@link authorizeUrl}. */
+      tokenUrl: string;
+      /** Optional userinfo endpoint. Same templating rules as {@link authorizeUrl}. */
+      userInfoUrl?: string;
+      scopes: ReadonlyArray<string>;
+      scopesFromPublicConfig?: CredentialOAuth2ScopesFromPublicConfig;
+      clientIdFieldKey?: string;
+      clientSecretFieldKey?: string;
+    }
 >;
 export type CredentialAuthDefinition = CredentialOAuth2AuthDefinition;

package/src/contracts/executionPersistenceContracts.ts CHANGED Viewed

@@ -148,6 +148,30 @@ export interface WorkflowRunDetailDto {
   readonly mutableState?: PersistedMutableRunState;
   readonly slotStates: ReadonlyArray<SlotExecutionStateDto>;
   readonly executionInstances: ReadonlyArray<ExecutionInstanceDto>;
+  readonly iterations?: ReadonlyArray<RunIterationDto>;
+}
+/**
+ * Per-item iteration projected from connection invocations and node activations.
+ *
+ * One iteration = one item processed by an agent within an activation. Multiple invocations
+ * (LLM rounds, tool calls) belonging to the same iteration share the iterationId.
+ */
+export interface RunIterationDto {
+  readonly iterationId: string;
+  readonly agentNodeId: NodeId;
+  readonly activationId: NodeActivationId;
+  readonly itemIndex: number;
+  readonly itemSummary?: string;
+  readonly status: NodeExecutionStatus;
+  readonly startedAt?: string;
+  readonly finishedAt?: string;
+  readonly invocationIds: ReadonlyArray<string>;
+  readonly parentInvocationId?: string;
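+  /** Estimated cost rolled up from telemetry cost metric points, keyed by ISO currency code (e.g. "USD"). Values are in minor units whose size is set by the metric's `cost.currency_scale` (so they may be finer than cents); see `estimatedCostCurrencyScaleByCurrency` for the per-currency scale. */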
+  readonly estimatedCostMinorByCurrency?: Readonly<Record<string, number>>;
+  /** Currency scale (denominator) per currency, when present on the metric points. Joined with `estimatedCostMinorByCurrency` to format human-readable amounts. */
+  readonly estimatedCostCurrencyScaleByCurrency?: Readonly<Record<string, number>>;
 }
 export interface SlotExecutionStateDto {
@@ -178,6 +202,12 @@ export interface ExecutionInstanceDto {
   readonly inputJson?: JsonValue;
   readonly outputJson?: JsonValue;
   readonly error?: Readonly<NodeExecutionError>;
+  /** Per-item iteration that produced this instance. Set on connectionInvocation rows produced inside per-item runnable loops. */
+  readonly iterationId?: string;
+  /** Item index (0-based) of the iteration. */
+  readonly itemIndex?: number;
+  /** Parent invocation id when this instance was emitted by a sub-agent triggered by an outer LLM/tool call. */
+  readonly parentInvocationId?: string;
 }
 export interface WorkflowDetailSelectionState {

package/src/contracts/index.ts CHANGED Viewed

@@ -1,3 +1,6 @@
+export * from "./baseTypes";
+export * from "./assertionTypes";
+export * from "./collectionTypes";
 export * from "./credentialTypes";
 export * from "./emitPorts";
 export * from "./executionPersistenceContracts";
@@ -6,6 +9,7 @@ export * from "./params";
 export * from "./itemExpr";
 export * from "./runtimeTypes";
 export * from "./telemetryTypes";
+export * from "./testTriggerTypes";
 export * from "./runFinishedAtFactory";
 export * from "./runTypes";
 export * from "./webhookTypes";

package/src/contracts/runTypes.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import type { TypeToken } from "../di";
-import type { RunEventBus } from "../events/runEvents";
+import type { RunEventBus, TestCaseRunStatus } from "../events/runEvents";
 import type {
   Edge,
   InputPortKey,
@@ -7,6 +7,7 @@ import type {
   JsonValue,
   NodeActivationId,
   NodeId,
+  NodeIterationId,
   NodeKind,
   NodeOutputs,
   OutputPortKey,
@@ -19,6 +20,23 @@ import type {
   WorkflowNodeConnection,
 } from "./workflowTypes";
+/**
+ * Test-suite linkage for a run. When set, this run was started by a TestSuiteOrchestrator
+ * as one test case inside a TestSuiteRun. The `IsTestRun` node and host-side persisters key
+ * off the presence of this field. Subworkflow runs inherit it from their parent run.
+ */
+export interface RunTestContext {
+  readonly testSuiteRunId: string;
+  readonly testCaseIndex: number;
+  /**
+   * Optional human-friendly label for this test case (e.g. an email subject when fixtures
+   * are loaded from a mailbox). Resolved per item by `TestTrigger.caseLabel(item)` if set,
+   * persisted on `Run.test_case_label` so the Tests-tab tree-table can show "RFQ for batch 14"
+   * instead of "run_1777755971399_bbb86beac1396".
+   */
+  readonly testCaseLabel?: string;
+}
 export interface RunExecutionOptions {
   /** Run-intent override: force the inline scheduler and bypass node-level offload decisions. */
   localOnly?: boolean;
@@ -35,6 +53,8 @@ export interface RunExecutionOptions {
   maxNodeActivations?: number;
   /** Effective cap after engine policy merge (subworkflow nesting). */
   maxSubworkflowDepth?: number;
+  /** Present iff started by a TestSuiteOrchestrator; propagates to subworkflow runs via {@link ParentExecutionRef.testContext}. */
+  testContext?: RunTestContext;
 }
 /** Engine-owned counters persisted with the run (worker-safe). */
@@ -154,6 +174,12 @@ export interface ConnectionInvocationRecord {
   readonly startedAt?: string;
   readonly finishedAt?: string;
   readonly updatedAt: string;
+  /** Per-item iteration id minted by the engine when this invocation occurred inside a runnable node's per-item loop. */
+  readonly iterationId?: NodeIterationId;
+  /** Item index (0-based) of the iteration that produced this invocation. */
+  readonly itemIndex?: number;
+  /** When set, this invocation was produced inside a sub-agent triggered by the named parent invocation. */
+  readonly parentInvocationId?: ConnectionInvocationId;
 }
 /** Arguments for appending a {@link ConnectionInvocationRecord} (engine fills run/workflow ids and timestamps). */
@@ -169,6 +195,9 @@ export type ConnectionInvocationAppendArgs = Readonly<{
   queuedAt?: string;
   startedAt?: string;
   finishedAt?: string;
+  iterationId?: NodeIterationId;
+  itemIndex?: number;
+  parentInvocationId?: ConnectionInvocationId;
 }>;
 export interface RunCurrentState {
@@ -210,6 +239,13 @@ export interface RunSummary {
   workflowId: WorkflowId;
   startedAt: string;
   status: RunStatus;
+  /**
+   * Test-case status for runs dispatched as part of a TestSuiteRun. Carries the
+   * assertion-rollup-corrected outcome the test orchestrator persists onto the row, so the
+   * executions list can show "failed" for a run whose workflow completed cleanly but whose
+   * assertions caught regressions. Absent for non-test runs and legacy rows.
+   */
+  testCaseStatus?: TestCaseRunStatus;
   /** ISO timestamp when the run finished (derived from node snapshots or store `updatedAt`); omit while running/pending. */
   finishedAt?: string;
   parent?: ParentExecutionRef;

package/src/contracts/runtimeTypes.ts CHANGED Viewed

@@ -2,14 +2,17 @@ import type { ReadableStream as BinaryReadableStream } from "node:stream/web";
 import type { TypeToken } from "../di";
 import type { RunEventBus } from "../events/runEvents";
 import type { CredentialSessionService } from "./credentialTypes";
+import type { CollectionsContext } from "./collectionTypes";
 import type { ExecutionTelemetry, ExecutionTelemetryFactory, NodeExecutionTelemetry } from "./telemetryTypes";
 import type {
   ConnectionInvocationAppendArgs,
+  ConnectionInvocationId,
   NodeInputsByPort,
   PersistedWorkflowSnapshot,
   PersistedWorkflowTokenRegistryLike,
   RunExecutionOptions,
   RunResult,
+  RunTestContext,
   WorkflowExecutionRepository,
 } from "./runTypes";
 import type { WorkflowActivationPolicy } from "./workflowActivationPolicy";
@@ -25,6 +28,7 @@ import type {
   NodeActivationId,
   NodeConfigBase,
   NodeId,
+  NodeIterationId,
   NodeOutputs,
   RunnableNodeConfig,
   OutputPortKey,
@@ -154,6 +158,21 @@ export interface ExecutionContext {
   telemetry: ExecutionTelemetry;
   binary: ExecutionBinaryService;
   getCredential<TSession = unknown>(slotKey: string): Promise<TSession>;
+  /** Per-item iteration id, set by {@link NodeExecutor} on the ctx passed into runnable `execute`. */
+  iterationId?: NodeIterationId;
+  /** Item index (0-based) within the current activation's batch; set alongside {@link iterationId}. */
+  itemIndex?: number;
+  /** When set, this ctx is executing inside a sub-agent triggered by the named parent invocation. */
+  parentInvocationId?: ConnectionInvocationId;
+  /**
+   * Present iff the run was started by a TestSuiteOrchestrator. The {@link IsTestRunNode}
+   * branches on this; assertion-emitting nodes use it to decide whether to record results.
+   */
+  testContext?: RunTestContext;
+  /**
+   * Collections registered in the codemation config, keyed by collection name.
+   */
+  readonly collections?: CollectionsContext;
 }
 export interface ExecutionContextFactory {
@@ -169,6 +188,7 @@ export interface ExecutionContextFactory {
     nodeState?: NodeExecutionStatePublisher;
     telemetry?: ExecutionTelemetry;
     getCredential<TSession = unknown>(slotKey: string): Promise<TSession>;
+    testContext?: RunTestContext;
   }): ExecutionContext;
 }
@@ -180,6 +200,24 @@ export interface NodeExecutionContext<TConfig extends NodeConfigBase = NodeConfi
   binary: NodeBinaryAttachmentService;
 }
+export interface PollingTriggerHandle {
+  /**
+   * Start the polling loop. The runtime registers its own cleanup handle so callers do not need to
+   * call {@link TriggerSetupContext.registerCleanup} for the loop.
+   * @returns The state returned by the first cycle (or `undefined` when the overlap guard fired).
+   */
+  start<TState, TItem>(args: {
+    intervalMs: number;
+    seedState?: TState;
+    runCycle: (cycleCtx: {
+      previousState: TState | undefined;
+      signal: AbortSignal;
+    }) => Promise<{ items: Items<TItem>; nextState: TState }>;
+  }): Promise<TState | undefined>;
+  /** Convenience dedup-window helper. */
+  readonly dedup: import("../triggers/polling/PollingTriggerDedupWindow").PollingTriggerDedupWindow;
+}
 export interface TriggerSetupContext<
   TConfig extends TriggerNodeConfig<any, any> = TriggerNodeConfig<any, any>,
   TSetupState extends JsonValue | undefined = TriggerNodeSetupState<TConfig>,
@@ -189,6 +227,8 @@ export interface TriggerSetupContext<
   previousState: TSetupState;
   registerCleanup(cleanup: TriggerCleanupHandle): void;
   emit(items: Items): Promise<void>;
+  /** Generic polling-trigger surface. Pre-binds trigger id, emit, and registerCleanup. */
+  readonly polling: PollingTriggerHandle;
 }
 export interface TriggerTestItemsContext<
@@ -431,4 +471,6 @@ export interface EngineDeps {
   workflowPolicyRuntimeDefaults?: WorkflowPolicyRuntimeDefaults;
   /** When set, logs inactive-workflow skips at boot and trigger start/stop on activation changes. */
   triggerRuntimeDiagnostics?: TriggerRuntimeDiagnostics;
+  /** When set, the polling-trigger runtime uses this logger for cycle info/debug/error. */
+  pollingTriggerLogger?: import("../triggers/polling/PollingTriggerLogger").PollingTriggerLogger;
 }

package/src/contracts/telemetryTypes.ts CHANGED Viewed

@@ -73,6 +73,14 @@ export interface TelemetrySpanScope extends TelemetryScope {
   readonly traceId: string;
   readonly spanId: string;
   end(args?: TelemetrySpanEnd): Promise<void> | void;
+  /**
+   * Lift this span into a {@link NodeExecutionTelemetry} scoped to a different (nodeId, activationId).
+   * Children created via the returned telemetry's `startChildSpan` get this span as their parent.
+   *
+   * Used at the sub-agent boundary so that nested runtime telemetry parents under the agent.tool.call
+   * span instead of the orchestrator's node-level span.
+   */
+  asNodeTelemetry(args: Readonly<{ nodeId: NodeId; activationId: NodeActivationId }>): NodeExecutionTelemetry;
 }
 export interface NodeExecutionTelemetry extends ExecutionTelemetry, TelemetrySpanScope {

package/src/contracts/testTriggerTypes.ts ADDED Viewed

@@ -0,0 +1,66 @@
+import type { Item, NodeId, WorkflowId } from "./workflowTypes";
+import type { TriggerNodeConfig } from "./workflowTypes";
+/**
+ * Identifier minted by the host (or in-memory test runner) for one execution of a test suite.
+ * One TestSuiteRun produces N child workflow runs, one per item yielded by `generateItems`.
+ */
+export type TestSuiteRunId = string;
+/**
+ * Setup context passed to a {@link TestTriggerNodeConfig.generateItems} callback. Distinct from
+ * {@link import("./runtimeTypes").TriggerSetupContext} on purpose: test triggers are not
+ * activated by the live trigger lifecycle (webhooks, cron, polling) and never call `emit` —
+ * the orchestrator pulls from the iterable they return and dispatches one run per item.
+ */
+export interface TestTriggerSetupContext<
+  TConfig extends TestTriggerNodeConfig<unknown> = TestTriggerNodeConfig<unknown>,
+> {
+  readonly workflowId: WorkflowId;
+  readonly nodeId: NodeId;
+  readonly config: TConfig;
+  readonly testSuiteRunId: TestSuiteRunId;
+  /**
+   * Resolves a credential session for a slot declared on this trigger's
+   * {@link import("./workflowTypes").NodeConfigBase.getCredentialRequirements}. Same contract as
+   * {@link import("./runtimeTypes").ExecutionContext.getCredential}.
+   */
+  getCredential<TSession = unknown>(slotKey: string): Promise<TSession>;
+  /** AbortSignal raised when the suite is cancelled — long-running pulls should bail out. */
+  readonly signal: AbortSignal;
+}
+/**
+ * A trigger config that emits **test cases**. Each item yielded by {@link generateItems}
+ * becomes one workflow run (with `executionOptions.testContext` set), so 10 yielded items
+ * → 10 runs marked under the same TestSuiteRun.
+ *
+ * The trigger is otherwise a normal {@link TriggerNodeConfig} (so the canvas treats it like
+ * any other trigger), but its `triggerKind` is `"test"` so the live activation policy skips it.
+ */
+export interface TestTriggerNodeConfig<TOutputJson = unknown> extends TriggerNodeConfig<TOutputJson, undefined> {
+  readonly triggerKind: "test";
+  /**
+   * Author-supplied async iterable of items, evaluated lazily. Implementations may fetch from
+   * credentialed APIs, read fixture files, or yield hard-coded items. The orchestrator iterates
+   * and dispatches one run per item, with concurrency capped by {@link concurrency} (default 4).
+   */
+  generateItems(ctx: TestTriggerSetupContext<TestTriggerNodeConfig<TOutputJson>>): AsyncIterable<Item<TOutputJson>>;
+  /** Per-suite-run cap on simultaneously-executing test cases. Default: 4. */
+  readonly concurrency?: number;
+  /**
+   * Free-form description of where the test cases come from — surfaced in the node properties
+   * panel and the suite-detail header so authors revisiting the workflow six months later
+   * remember which mailbox / folder / fixture file the cases originate from.
+   *
+   * Example: `"All emails in the Gmail label \"test/triage-fixtures\" — 14 messages as of 2026-05-03."`
+   */
+  readonly description?: string;
+  /**
+   * Resolves a human-readable label for one yielded test case (e.g. email subject). The
+   * orchestrator calls this once per yielded item, persists the result on the run, and the
+   * Tests-tab UI uses it to render the case row instead of the opaque runId. Return
+   * `undefined` to fall back to "Case #N".
+   */
+  caseLabel?(item: Item<TOutputJson>): string | undefined;
+}

package/src/contracts/workflowTypes.ts CHANGED Viewed

@@ -3,13 +3,18 @@ import type { ZodType } from "zod";
 import type { TypeToken } from "../di";
 import type { CredentialRequirement } from "./credentialTypes";
 import type { RetryPolicySpec } from "./retryPolicySpec.types";
+import type { InputPortKey, NodeConnectionName, NodeId, OutputPortKey, WorkflowId } from "./baseTypes";
+export type {
+  InputPortKey,
+  NodeConnectionName,
+  NodeId,
+  OutputPortKey,
+  PersistedTokenId,
+  WorkflowId,
+} from "./baseTypes";
-export type WorkflowId = string;
-export type NodeId = string;
 export type NodeIdRef<TJson = unknown> = NodeId & Readonly<{ __codemationNodeJson?: TJson }>;
-export type OutputPortKey = string;
-export type InputPortKey = string;
-export type PersistedTokenId = string;
 export type NodeKind = "trigger" | "node";
 export type JsonPrimitive = string | number | boolean | null;
@@ -26,8 +31,6 @@ export interface Edge {
   to: { nodeId: NodeId; input: InputPortKey };
 }
-export type NodeConnectionName = string;
 /**
  * Named connection from a parent node to child nodes that exist in {@link WorkflowDefinition.nodes}
  * but are not traversed by the main execution graph. Parents are commonly executable nodes, but may
@@ -91,6 +94,14 @@ export interface NodeConfigBase {
   readonly declaredOutputPorts?: ReadonlyArray<OutputPortKey>;
   readonly declaredInputPorts?: ReadonlyArray<InputPortKey>;
   getCredentialRequirements?(): ReadonlyArray<CredentialRequirement>;
+  /**
+   * Marker: this node emits {@link import("./assertionTypes").AssertionResult}-shaped items on its
+   * `main` port. The TestSuiteOrchestrator (and host-side TestAssertionPersister) listen for
+   * `nodeCompleted` events from nodes with this flag set, and persist their output items as
+   * TestAssertion records (only when the run carries a `testContext`). Set on assertion node
+   * configs (e.g. `AssertionNodeConfig`, `StringEqualsAssertionNodeConfig`).
+   */
+  readonly emitsAssertions?: true;
 }
 export declare const runnableNodeInputType: unique symbol;
@@ -127,6 +138,12 @@ export interface TriggerNodeConfig<
   readonly kind: "trigger";
   readonly [triggerNodeOutputType]?: TOutputJson;
   readonly [triggerNodeSetupStateType]?: TSetupState;
+  /**
+   * Distinguishes triggers driven by the live activation policy (webhooks, cron, polling) from
+   * triggers driven only by the {@link TestSuiteOrchestrator}. `WorkflowActivation` skips
+   * `"test"` triggers; the orchestrator skips `"live"` triggers. Defaults to `"live"` when omitted.
+   */
+  readonly triggerKind?: "live" | "test";
 }
 export type RunnableNodeInputJson<TConfig extends RunnableNodeConfig<any, any>> =
@@ -194,6 +211,12 @@ export type NodeOutputs = Partial<Record<OutputPortKey, Items>>;
 export type RunId = string;
 export type NodeActivationId = string;
+/**
+ * Identifies one per-item iteration of a runnable node's execute loop. Refines `NodeActivationId`
+ * for per-item connection invocations and telemetry. Fields carrying this id are left undefined
+ * when the executing node is a batch node or trigger that does not iterate items.
+ */
+export type NodeIterationId = string;
 export interface ParentExecutionRef {
   runId: RunId;
@@ -205,6 +228,12 @@ export interface ParentExecutionRef {
   engineMaxNodeActivations?: number;
   /** Effective max subworkflow depth from the parent run (propagated to child policy merge). */
   engineMaxSubworkflowDepth?: number;
+  /**
+   * Test-suite linkage inherited by the child subworkflow run. Set by whichever node
+   * spawns the subworkflow when its own `ctx.testContext` is present, so assertions
+   * emitted inside a subworkflow land under the correct parent test case.
+   */
+  testContext?: import("./runTypes").RunTestContext;
 }
 export interface RunDataSnapshot {

package/src/contracts.ts ADDED Viewed

@@ -0,0 +1,59 @@
+// Type-only re-exports, plus the two runtime assertion exports surfaced explicitly below. Use this for type-only consumers that should not drag in runtime DSL or factory code.
+// This subpath prevents unnecessary compile-graph bloat for packages that only need types like NodeId, Items, etc.
+export type * from "./contracts/baseTypes";
+export type * from "./contracts/assertionTypes";
+// assertionTypes also exports a runtime helper for deriving pass/fail from a score+threshold.
+// We keep the type-only re-export above and surface the helper explicitly here so UI consumers
+// (next-host) don't need to re-implement the comparison.
+export { deriveAssertionPassed, DEFAULT_ASSERTION_PASS_THRESHOLD } from "./contracts/assertionTypes";
+export type * from "./contracts/params";
+export type * from "./contracts/retryPolicySpec.types";
+export type * from "./contracts/CostCatalogContract";
+export type * from "./contracts/executionPersistenceContracts";
+export type * from "./contracts/runtimeTypes";
+export type * from "./contracts/telemetryTypes";
+export type * from "./contracts/testTriggerTypes";
+export type * from "./contracts/runTypes";
+export type * from "./contracts/webhookTypes";
+export type * from "./contracts/workflowTypes";
+// credentialTypes mixes types (Credential* interfaces) with runtime (CredentialUnboundError class).
+// Export type-only subset for pure type consumers.
+export type {
+  CredentialTypeId,
+  CredentialInstanceId,
+  CredentialMaterialSourceKind,
+  CredentialSetupStatus,
+  CredentialHealthStatus,
+  CredentialFieldSchema,
+  CredentialRequirement,
+  CredentialBindingKey,
+  CredentialBinding,
+  CredentialHealth,
+  OAuth2ProviderFromPublicConfig,
+  CredentialOAuth2ScopesFromPublicConfig,
+  CredentialOAuth2AuthDefinition,
+  CredentialAuthDefinition,
+  CredentialAdvancedSectionPresentation,
+  CredentialTypeDefinition,
+  CredentialJsonRecord,
+  CredentialInstanceRecord,
+  CredentialSessionFactoryArgs,
+  CredentialSessionFactory,
+  CredentialHealthTester,
+  CredentialType,
+  AnyCredentialType,
+  CredentialSessionService,
+  CredentialTypeRegistry,
+} from "./contracts/credentialTypes";
+// CostTrackingTelemetryContract mixes types with const runtime values (metric/attribute names).
+// Export type-only subset for pure type consumers.
+export type {
+  CostTrackingComponent,
+  CostTrackingUsageRecord,
+  CostTrackingPriceQuote,
+  CostTrackingTelemetry,
+  CostTrackingTelemetryFactory,
+} from "./contracts/CostTrackingTelemetryContract";

package/src/events/ConnectionInvocationEventPublisher.ts ADDED Viewed

@@ -0,0 +1,46 @@
+import type { ConnectionInvocationRecord } from "../contracts/runTypes";
+import type { ParentExecutionRef } from "../types";
+import type { RunEventBus } from "./runEvents";
+/**
+ * Publishes per-invocation lifecycle records onto the run {@link RunEventBus}.
+ *
+ * Surgical, per-invocation events let the UI update the right-side inspector timeline as each
+ * LLM round / tool call moves from `queued`/`running` (both published as "started") to `completed`
+ * or `failed`, without depending on a coarse `runSaved` poll. Any other status publishes nothing.
+ */
+export class ConnectionInvocationEventPublisher {
+  constructor(
+    private readonly eventBus: RunEventBus | undefined,
+    private readonly parent: ParentExecutionRef | undefined,
+  ) {}
+  async publish(record: ConnectionInvocationRecord): Promise<void> {
+    if (!this.eventBus) return;
+    const kind = this.kindFor(record);
+    if (!kind) return;
+    await this.eventBus.publish({
+      kind,
+      runId: record.runId,
+      workflowId: record.workflowId,
+      parent: this.parent,
+      at: record.updatedAt,
+      record,
+    });
+  }
+  private kindFor(
+    record: ConnectionInvocationRecord,
+  ): "connectionInvocationStarted" | "connectionInvocationCompleted" | "connectionInvocationFailed" | undefined {
+    if (record.status === "running" || record.status === "queued") {
+      return "connectionInvocationStarted";
+    }
+    if (record.status === "completed") {
+      return "connectionInvocationCompleted";
+    }
+    if (record.status === "failed") {
+      return "connectionInvocationFailed";
+    }
+    return undefined;
+  }
+}