npm - @poncho-ai/harness - Versions diffs - 0.28.3 → 0.30.0 - Mend

@poncho-ai/harness 0.28.3 → 0.30.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/.turbo/turbo-build.log CHANGED Viewed

@@ -1,5 +1,5 @@
-> @poncho-ai/harness@0.28.3 build /home/runner/work/poncho-ai/poncho-ai/packages/harness
+> @poncho-ai/harness@0.30.0 build /home/runner/work/poncho-ai/poncho-ai/packages/harness
 > node scripts/embed-docs.js && tsup src/index.ts --format esm --dts
 [embed-docs] Generated poncho-docs.ts with 4 topics
@@ -8,8 +8,8 @@
 CLI tsup v8.5.1
 CLI Target: es2022
 ESM Build start
-ESM dist/index.js 291.95 KB
-ESM ⚡️ Build success in 123ms
+ESM dist/index.js 300.00 KB
+ESM ⚡️ Build success in 135ms
 DTS Build start
-DTS ⚡️ Build success in 6599ms
-DTS dist/index.d.ts 29.62 KB
+DTS ⚡️ Build success in 7526ms
+DTS dist/index.d.ts 30.64 KB

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,27 @@
 # @poncho-ai/harness
+## 0.30.0
+### Minor Changes
+- [`193c367`](https://github.com/cesr/poncho-ai/commit/193c367568dce22a470dff6acd022c221be3b722) Thanks [@cesr](https://github.com/cesr)! - Unified continuation logic across all entry points (chat, cron, subagents, SDK) with mid-stream soft deadline checkpointing and proper context preservation across continuation boundaries.
+### Patch Changes
+- Updated dependencies [[`193c367`](https://github.com/cesr/poncho-ai/commit/193c367568dce22a470dff6acd022c221be3b722)]:
+  - @poncho-ai/sdk@1.6.3
+## 0.29.0
+### Minor Changes
+- [#51](https://github.com/cesr/poncho-ai/pull/51) [`eb661a5`](https://github.com/cesr/poncho-ai/commit/eb661a554da6839702651671db8a8820ceb13f35) Thanks [@cesr](https://github.com/cesr)! - Add generic OTLP trace exporter for sending OpenTelemetry traces to any collector (Jaeger, Grafana Tempo, Honeycomb, etc.). Configure via `telemetry.otlp` as a URL string or `{ url, headers }` object. Works alongside or instead of Latitude telemetry.
+### Patch Changes
+- Updated dependencies [[`eb661a5`](https://github.com/cesr/poncho-ai/commit/eb661a554da6839702651671db8a8820ceb13f35)]:
+  - @poncho-ai/sdk@1.6.2
 ## 0.28.3
 ### Patch Changes

package/dist/index.d.ts CHANGED Viewed

@@ -176,6 +176,15 @@ interface Conversation {
     /** Harness-internal message chain preserved across continuation runs.
      *  Cleared when a run completes without continuation. */
     _continuationMessages?: Message[];
+    /** Number of continuation pickups for the current multi-step run.
+     *  Reset when a run completes without continuation. Used to enforce
+     *  a maximum continuation count across all entry points. */
+    _continuationCount?: number;
+    /** Full structured message chain from the last harness run, including
+     *  tool-call and tool-result messages the model needs for context.
+     *  Unlike `_continuationMessages`, this is always set after a run
+     *  and does NOT signal that a continuation is pending. */
+    _harnessMessages?: Message[];
     createdAt: number;
     updatedAt: number;
 }
@@ -411,7 +420,10 @@ interface PonchoConfig extends McpConfig {
     };
     telemetry?: {
         enabled?: boolean;
-        otlp?: string;
+        otlp?: string | {
+            url: string;
+            headers?: Record<string, string>;
+        };
         latitude?: {
             apiKeyEnv?: string;
             projectIdEnv?: string;
@@ -623,6 +635,9 @@ declare class AgentHarness {
     private readonly activeSkillNames;
     private readonly registeredMcpToolNames;
     private latitudeTelemetry?;
+    private otlpSpanProcessor?;
+    private otlpTracerProvider?;
+    private hasOtlpExporter;
     private insideTelemetryCapture;
     private _browserSession?;
     private _browserMod?;
@@ -686,8 +701,9 @@ declare class AgentHarness {
     shutdown(): Promise<void>;
     listTools(): ToolDefinition[];
     /**
-     * Wraps the run() generator with Latitude telemetry capture for complete trace coverage
-     * Streams events in real-time using an event queue pattern
+     * Wraps the run() generator with telemetry capture for complete trace coverage.
+     * Supports Latitude, generic OTLP, or both simultaneously.
+     * Streams events in real-time using an event queue pattern.
      */
     runWithTelemetry(input: RunInput): AsyncGenerator<AgentEvent>;
     compact(messages: Message[], options?: CompactMessagesOptions): Promise<CompactResult>;
@@ -804,9 +820,15 @@ declare const createSkillTools: (skills: SkillMetadata[], options?: {
 }) => ToolDefinition[];
 declare const normalizeScriptPolicyPath: (relativePath: string) => string;
+interface OtlpConfig {
+    url: string;
+    headers?: Record<string, string>;
+}
+type OtlpOption = string | OtlpConfig;
+declare function normalizeOtlp(opt: OtlpOption | undefined): OtlpConfig | undefined;
 interface TelemetryConfig {
     enabled?: boolean;
-    otlp?: string;
+    otlp?: OtlpOption;
     latitude?: {
         apiKeyEnv?: string;
         projectIdEnv?: string;
@@ -824,4 +846,4 @@ declare class TelemetryEmitter {
 declare const createSubagentTools: (manager: SubagentManager) => ToolDefinition[];
-export { type AgentFrontmatter, AgentHarness, type AgentIdentity, type AgentLimitsConfig, type AgentModelConfig, type BuiltInToolToggles, type CompactMessagesOptions, type CompactResult, type CompactionConfig, type Conversation, type ConversationState, type ConversationStore, type ConversationSummary, type CronJobConfig, type HarnessOptions, type HarnessRunOutput, InMemoryConversationStore, InMemoryStateStore, LatitudeCapture, type LatitudeCaptureConfig, LocalMcpBridge, LocalUploadStore, type MainMemory, type McpConfig, type MemoryConfig, type MemoryStore, type MessagingChannelConfig, type ModelProviderFactory, PONCHO_UPLOAD_SCHEME, type ParsedAgent, type PendingSubagentResult, type PonchoConfig, type ProviderConfig, type RemoteMcpServerConfig, type RuntimeRenderContext, S3UploadStore, STORAGE_SCHEMA_VERSION, type SkillContextEntry, type SkillMetadata, type StateConfig, type StateProviderName, type StateStore, type StorageConfig, type SubagentManager, type SubagentResult, type SubagentSpawnResult, type SubagentSummary, type TelemetryConfig, TelemetryEmitter, type ToolAccess, type ToolCall, ToolDispatcher, type ToolExecutionResult, type UploadStore, type UploadsConfig, VercelBlobUploadStore, buildAgentDirectoryName, buildSkillContextWindow, compactMessages, createConversationStore, createDefaultTools, createDeleteDirectoryTool, createDeleteTool, createEditTool, createMemoryStore, createMemoryTools, createModelProvider, createSearchTools, createSkillTools, createStateStore, createSubagentTools, createUploadStore, createWriteTool, deriveUploadKey, ensureAgentIdentity, estimateTokens, estimateTotalTokens, findSafeSplitPoint, generateAgentId, getAgentStoreDirectory, getModelContextWindow, getPonchoStoreRoot, jsonSchemaToZod, loadPonchoConfig, loadSkillContext, loadSkillInstructions, loadSkillMetadata, normalizeScriptPolicyPath, parseAgentFile, parseAgentMarkdown, ponchoDocsTool, readSkillResource, renderAgentPrompt, resolveAgentIdentity, resolveCompactionConfig, 
resolveMemoryConfig, resolveSkillDirs, resolveStateConfig, slugifyStorageComponent };
+export { type AgentFrontmatter, AgentHarness, type AgentIdentity, type AgentLimitsConfig, type AgentModelConfig, type BuiltInToolToggles, type CompactMessagesOptions, type CompactResult, type CompactionConfig, type Conversation, type ConversationState, type ConversationStore, type ConversationSummary, type CronJobConfig, type HarnessOptions, type HarnessRunOutput, InMemoryConversationStore, InMemoryStateStore, LatitudeCapture, type LatitudeCaptureConfig, LocalMcpBridge, LocalUploadStore, type MainMemory, type McpConfig, type MemoryConfig, type MemoryStore, type MessagingChannelConfig, type ModelProviderFactory, type OtlpConfig, type OtlpOption, PONCHO_UPLOAD_SCHEME, type ParsedAgent, type PendingSubagentResult, type PonchoConfig, type ProviderConfig, type RemoteMcpServerConfig, type RuntimeRenderContext, S3UploadStore, STORAGE_SCHEMA_VERSION, type SkillContextEntry, type SkillMetadata, type StateConfig, type StateProviderName, type StateStore, type StorageConfig, type SubagentManager, type SubagentResult, type SubagentSpawnResult, type SubagentSummary, type TelemetryConfig, TelemetryEmitter, type ToolAccess, type ToolCall, ToolDispatcher, type ToolExecutionResult, type UploadStore, type UploadsConfig, VercelBlobUploadStore, buildAgentDirectoryName, buildSkillContextWindow, compactMessages, createConversationStore, createDefaultTools, createDeleteDirectoryTool, createDeleteTool, createEditTool, createMemoryStore, createMemoryTools, createModelProvider, createSearchTools, createSkillTools, createStateStore, createSubagentTools, createUploadStore, createWriteTool, deriveUploadKey, ensureAgentIdentity, estimateTokens, estimateTotalTokens, findSafeSplitPoint, generateAgentId, getAgentStoreDirectory, getModelContextWindow, getPonchoStoreRoot, jsonSchemaToZod, loadPonchoConfig, loadSkillContext, loadSkillInstructions, loadSkillMetadata, normalizeOtlp, normalizeScriptPolicyPath, parseAgentFile, parseAgentMarkdown, ponchoDocsTool, readSkillResource, renderAgentPrompt, 
resolveAgentIdentity, resolveCompactionConfig, resolveMemoryConfig, resolveSkillDirs, resolveStateConfig, slugifyStorageComponent };

package/dist/index.js CHANGED Viewed

@@ -1529,11 +1529,17 @@ export default {
     },
   },
-  // Telemetry destination
+  // Telemetry destination \u2014 generic OTLP and/or Latitude
   telemetry: {
     enabled: true,
+    // Generic OTLP: string shorthand or { url, headers? } object
     otlp: process.env.OTEL_EXPORTER_OTLP_ENDPOINT,
-    // Or use Latitude (reads from LATITUDE_API_KEY and LATITUDE_PROJECT_ID env vars by default)
+    // With auth headers (Honeycomb, Grafana Cloud, etc.):
+    // otlp: {
+    //   url: 'https://api.honeycomb.io/v1/traces',
+    //   headers: { 'x-honeycomb-team': process.env.HONEYCOMB_API_KEY },
+    // },
+    // Latitude (reads from LATITUDE_API_KEY and LATITUDE_PROJECT_ID env vars by default)
     latitude: {
       // apiKeyEnv: 'LATITUDE_API_KEY',       // default
       // projectIdEnv: 'LATITUDE_PROJECT_ID', // default
@@ -1606,7 +1612,7 @@ Remote storage keys are namespaced and versioned, for example \`poncho:v1:<agent
 | \`PONCHO_AUTH_TOKEN\` | No | Unified auth token (Web UI passphrase + API Bearer token) |
 | \`PONCHO_INTERNAL_SECRET\` | No | Shared secret used by internal serverless callbacks (recommended for Vercel/Lambda) |
 | \`PONCHO_SELF_BASE_URL\` | No | Explicit base URL for internal self-callbacks when auto-detection is unavailable |
-| \`OTEL_EXPORTER_OTLP_ENDPOINT\` | No | Telemetry destination |
+| \`OTEL_EXPORTER_OTLP_ENDPOINT\` | No | OTLP trace endpoint (Jaeger, Tempo, Honeycomb, etc.) |
 | \`LATITUDE_API_KEY\` | No | Latitude dashboard integration |
 | \`LATITUDE_PROJECT_ID\` | No | Latitude project identifier for capture traces |
 | \`LATITUDE_PATH\` | No | Latitude prompt path for grouping traces |
@@ -1641,23 +1647,45 @@ Logs print to console:
 [event] run:completed {"type":"run:completed","runId":"run_abc123","result":{"status":"completed","response":"...","steps":3,"tokens":{"input":1500,"output":840}}}
 \`\`\`
-### Production telemetry
+### Production telemetry (generic OTLP)
-Send events to your observability stack:
+Send full OpenTelemetry traces (agent runs, LLM calls, tool executions) to any
+OTLP-compatible collector \u2014 Jaeger, Grafana Tempo, Honeycomb, Datadog, etc.
 \`\`\`bash
-# Environment variable
-OTEL_EXPORTER_OTLP_ENDPOINT=https://otel.example.com
+# Simple: just a URL
+OTEL_EXPORTER_OTLP_ENDPOINT=https://otel.example.com/v1/traces
 \`\`\`
-Or configure in code:
+\`\`\`javascript
+// poncho.config.js \u2014 string shorthand
+export default {
+  telemetry: {
+    otlp: 'https://otel.example.com/v1/traces',
+  }
+}
+\`\`\`
+\`\`\`javascript
+// poncho.config.js \u2014 with auth headers (Honeycomb, Grafana Cloud, etc.)
+export default {
+  telemetry: {
+    otlp: {
+      url: 'https://api.honeycomb.io/v1/traces',
+      headers: {
+        'x-honeycomb-team': process.env.HONEYCOMB_API_KEY,
+      },
+    },
+  }
+}
+\`\`\`
+You can also use a custom event handler for non-OTLP destinations:
 \`\`\`javascript
 // poncho.config.js
 export default {
   telemetry: {
-    otlp: 'https://otel.example.com',
-    // Or custom handler
     handler: async (event) => {
       await sendToMyLoggingService(event)
     }
@@ -1687,6 +1715,8 @@ telemetry: {
 }
 \`\`\`
+Both \`otlp\` and \`latitude\` can be configured simultaneously \u2014 all spans flow to both destinations.
 ## Security
 ### Protect your endpoint
@@ -4581,6 +4611,78 @@ var createSubagentTools = (manager) => [
 // src/harness.ts
 import { LatitudeTelemetry } from "@latitude-data/telemetry";
+import { trace, context as otelContext, SpanStatusCode } from "@opentelemetry/api";
+import { NodeTracerProvider, BatchSpanProcessor } from "@opentelemetry/sdk-trace-node";
+import { OTLPTraceExporter } from "@opentelemetry/exporter-trace-otlp-http";
+// src/telemetry.ts
+var MAX_FIELD_LENGTH = 200;
+function sanitizeEventForLog(event) {
+  return JSON.stringify(event, (_key, value) => {
+    if (typeof value === "string" && value.length > MAX_FIELD_LENGTH) {
+      return `${value.slice(0, 80)}...[${value.length} chars]`;
+    }
+    return value;
+  });
+}
+function normalizeOtlp(opt) {
+  if (!opt) return void 0;
+  if (typeof opt === "string") return opt ? { url: opt } : void 0;
+  return opt.url ? opt : void 0;
+}
+var TelemetryEmitter = class {
+  config;
+  constructor(config) {
+    this.config = config;
+  }
+  async emit(event) {
+    if (this.config?.enabled === false) {
+      return;
+    }
+    if (this.config?.handler) {
+      await this.config.handler(event);
+      return;
+    }
+    const otlp = normalizeOtlp(this.config?.otlp);
+    if (otlp) {
+      await this.sendOtlp(event, otlp);
+    }
+    process.stdout.write(`[event] ${event.type} ${sanitizeEventForLog(event)}
+`);
+  }
+  async sendOtlp(event, otlp) {
+    try {
+      await fetch(otlp.url, {
+        method: "POST",
+        headers: { "Content-Type": "application/json", ...otlp.headers },
+        body: JSON.stringify({
+          resourceLogs: [
+            {
+              scopeLogs: [
+                {
+                  logRecords: [
+                    {
+                      timeUnixNano: String(Date.now() * 1e6),
+                      severityText: "INFO",
+                      body: { stringValue: event.type },
+                      attributes: [
+                        {
+                          key: "event.payload",
+                          value: { stringValue: JSON.stringify(event) }
+                        }
+                      ]
+                    }
+                  ]
+                }
+              ]
+            }
+          ]
+        })
+      });
+    } catch {
+    }
+  }
+};
 // src/tool-dispatcher.ts
 var ToolDispatcher = class {
@@ -5113,6 +5215,9 @@ var AgentHarness = class _AgentHarness {
   activeSkillNames = /* @__PURE__ */ new Set();
   registeredMcpToolNames = /* @__PURE__ */ new Set();
   latitudeTelemetry;
+  otlpSpanProcessor;
+  otlpTracerProvider;
+  hasOtlpExporter = false;
   insideTelemetryCapture = false;
   _browserSession;
   _browserMod;
@@ -5560,6 +5665,31 @@ var AgentHarness = class _AgentHarness {
         `[poncho][telemetry] Latitude telemetry is configured but missing: ${missing.join(", ")}. Traces will NOT be sent.`
       );
     }
+    const otlpConfig = telemetryEnabled ? normalizeOtlp(config?.telemetry?.otlp) : void 0;
+    if (otlpConfig) {
+      const exporter = new OTLPTraceExporter({
+        url: otlpConfig.url,
+        headers: otlpConfig.headers
+      });
+      const processor = new BatchSpanProcessor(exporter);
+      this.otlpSpanProcessor = processor;
+      if (this.latitudeTelemetry) {
+        const globalProvider = trace.getTracerProvider();
+        const delegate = globalProvider.getDelegate?.() ?? globalProvider;
+        if (typeof delegate.addSpanProcessor === "function") {
+          delegate.addSpanProcessor(processor);
+        }
+        console.info(`[poncho][telemetry] OTLP exporter added (piggybacking on Latitude provider) \u2192 ${otlpConfig.url}`);
+      } else {
+        const provider2 = new NodeTracerProvider({
+          spanProcessors: [processor]
+        });
+        provider2.register();
+        this.otlpTracerProvider = provider2;
+        console.info(`[poncho][telemetry] OTLP exporter active (standalone provider) \u2192 ${otlpConfig.url}`);
+      }
+      this.hasOtlpExporter = true;
+    }
   }
   async buildBrowserStoragePersistence(config, sessionId) {
     const provider = config.storage?.provider ?? config.state?.provider ?? "local";
@@ -5710,13 +5840,31 @@ var AgentHarness = class _AgentHarness {
       });
       this.latitudeTelemetry = void 0;
     }
+    if (this.otlpSpanProcessor) {
+      await this.otlpSpanProcessor.shutdown().catch((err) => {
+        console.warn(
+          `[poncho][telemetry] OTLP span processor shutdown error: ${err instanceof Error ? err.message : String(err)}`
+        );
+      });
+      this.otlpSpanProcessor = void 0;
+    }
+    if (this.otlpTracerProvider) {
+      await this.otlpTracerProvider.shutdown().catch((err) => {
+        console.warn(
+          `[poncho][telemetry] OTLP tracer provider shutdown error: ${err instanceof Error ? err.message : String(err)}`
+        );
+      });
+      this.otlpTracerProvider = void 0;
+    }
+    this.hasOtlpExporter = false;
   }
   listTools() {
     return this.dispatcher.list();
   }
   /**
-   * Wraps the run() generator with Latitude telemetry capture for complete trace coverage
-   * Streams events in real-time using an event queue pattern
+   * Wraps the run() generator with telemetry capture for complete trace coverage.
+   * Supports Latitude, generic OTLP, or both simultaneously.
+   * Streams events in real-time using an event queue pattern.
    */
   async *runWithTelemetry(input) {
     const config = this.loadedConfig;
@@ -5783,6 +5931,39 @@ var AgentHarness = class _AgentHarness {
           }
         }
       }
+    } else if (this.hasOtlpExporter) {
+      const tracer = trace.getTracer("poncho");
+      const agentName = this.parsedAgent?.frontmatter.name ?? "agent";
+      const rootSpan = tracer.startSpan(`agent.run ${agentName}`);
+      rootSpan.setAttribute("poncho.agent.name", agentName);
+      if (input.conversationId) {
+        rootSpan.setAttribute("poncho.conversation.id", input.conversationId);
+      }
+      const spanContext = trace.setSpan(otelContext.active(), rootSpan);
+      this.insideTelemetryCapture = true;
+      try {
+        const gen = this.run(input);
+        let next;
+        do {
+          next = await otelContext.with(spanContext, () => gen.next());
+          if (!next.done) yield next.value;
+        } while (!next.done);
+        rootSpan.setStatus({ code: SpanStatusCode.OK });
+      } catch (error) {
+        rootSpan.setStatus({
+          code: SpanStatusCode.ERROR,
+          message: error instanceof Error ? error.message : String(error)
+        });
+        rootSpan.recordException(error instanceof Error ? error : new Error(String(error)));
+        throw error;
+      } finally {
+        this.insideTelemetryCapture = false;
+        rootSpan.end();
+        try {
+          await this.otlpSpanProcessor?.forceFlush();
+        } catch {
+        }
+      }
     } else {
       yield* this.run(input);
     }
@@ -5950,7 +6131,7 @@ ${this.skillFingerprint}`;
       if (lastMsg && lastMsg.role !== "user") {
         messages.push({
           role: "user",
-          content: "[System: Your previous turn was interrupted by a time limit. Continue from where you left off \u2014 do NOT repeat what you already said. Proceed directly with the next action or tool call.]",
+          content: "[System: Your previous turn was interrupted by a time limit. Your partial response above is already visible to the user. Continue EXACTLY from where you left off \u2014 do NOT restart, re-summarize, or repeat any content you already produced. If you were mid-sentence or mid-table, continue that sentence or table. Proceed directly with the next action or output.]",
           metadata: { timestamp: now(), id: randomUUID3() }
         });
       }
@@ -6271,7 +6452,7 @@ ${textContent}` };
           abortSignal: input.abortSignal,
           ...typeof maxTokens === "number" ? { maxTokens } : {},
           experimental_telemetry: {
-            isEnabled: telemetryEnabled && !!this.latitudeTelemetry,
+            isEnabled: telemetryEnabled && !!(this.latitudeTelemetry || this.hasOtlpExporter),
             recordInputs: true,
             recordOutputs: true
           }
@@ -6280,7 +6461,10 @@ ${textContent}` };
         let chunkCount = 0;
         const hasRunTimeout = timeoutMs > 0;
         const streamDeadline = hasRunTimeout ? start + timeoutMs : 0;
+        const hasSoftDeadline = softDeadlineMs > 0;
+        const INTER_CHUNK_TIMEOUT_MS = 6e4;
         const fullStreamIterator = result.fullStream[Symbol.asyncIterator]();
+        let softDeadlineFiredDuringStream = false;
         try {
           while (true) {
             if (isCancelled()) {
@@ -6288,8 +6472,8 @@ ${textContent}` };
               return;
             }
             if (hasRunTimeout) {
-              const remaining2 = streamDeadline - now();
-              if (remaining2 <= 0) {
+              const remaining = streamDeadline - now();
+              if (remaining <= 0) {
                 yield pushEvent({
                   type: "run:error",
                   runId,
@@ -6304,22 +6488,33 @@ ${textContent}` };
                 return;
               }
             }
-            const remaining = hasRunTimeout ? streamDeadline - now() : Infinity;
-            const timeout = chunkCount === 0 ? Math.min(remaining, FIRST_CHUNK_TIMEOUT_MS) : hasRunTimeout ? remaining : 0;
+            if (hasSoftDeadline && chunkCount > 0 && now() - start >= softDeadlineMs) {
+              softDeadlineFiredDuringStream = true;
+              break;
+            }
+            const hardRemaining = hasRunTimeout ? streamDeadline - now() : Infinity;
+            const softRemaining = hasSoftDeadline ? Math.max(0, start + softDeadlineMs - now()) : Infinity;
+            const deadlineRemaining = Math.min(hardRemaining, softRemaining);
+            const timeout = chunkCount === 0 ? Math.min(deadlineRemaining, FIRST_CHUNK_TIMEOUT_MS) : Math.min(deadlineRemaining, INTER_CHUNK_TIMEOUT_MS);
             let nextPart;
-            if (timeout <= 0 && chunkCount > 0) {
+            if (timeout <= 0 && chunkCount > 0 && !hasSoftDeadline) {
               nextPart = await fullStreamIterator.next();
             } else {
+              const effectiveTimeout = Math.max(timeout, 1);
               let timer;
               nextPart = await Promise.race([
                 fullStreamIterator.next(),
                 new Promise((resolve12) => {
-                  timer = setTimeout(() => resolve12(null), timeout);
+                  timer = setTimeout(() => resolve12(null), effectiveTimeout);
                 })
               ]);
               clearTimeout(timer);
             }
             if (nextPart === null) {
+              if (hasSoftDeadline && deadlineRemaining <= INTER_CHUNK_TIMEOUT_MS) {
+                softDeadlineFiredDuringStream = true;
+                break;
+              }
               const isFirstChunk = chunkCount === 0;
               console.error(
                 `[poncho][harness] Stream timeout waiting for ${isFirstChunk ? "first" : "next"} chunk: model="${modelName}", step=${step}, chunks=${chunkCount}, elapsed=${now() - start}ms`
@@ -6352,11 +6547,42 @@ ${textContent}` };
           fullStreamIterator.return?.(void 0)?.catch?.(() => {
           });
         }
+        if (softDeadlineFiredDuringStream) {
+          if (fullText.length > 0) {
+            messages.push({
+              role: "assistant",
+              content: fullText,
+              metadata: { timestamp: now(), id: randomUUID3(), step }
+            });
+          }
+          const result_ = {
+            status: "completed",
+            response: responseText + fullText,
+            steps: step,
+            tokens: { input: totalInputTokens, output: totalOutputTokens, cached: totalCachedTokens },
+            duration: now() - start,
+            continuation: true,
+            continuationMessages: [...messages],
+            maxSteps,
+            contextTokens: latestContextTokens + toolOutputEstimateSinceModel,
+            contextWindow
+          };
+          console.info(`[poncho][harness] Soft deadline fired mid-stream at step ${step} (${(now() - start).toFixed(0)}ms). Checkpointing with ${fullText.length} chars of partial text.`);
+          yield pushEvent({ type: "run:completed", runId, result: result_ });
+          return;
+        }
         if (isCancelled()) {
           yield emitCancellation();
           return;
         }
         if (softDeadlineMs > 0 && now() - start > softDeadlineMs) {
+          if (fullText.length > 0) {
+            messages.push({
+              role: "assistant",
+              content: fullText,
+              metadata: { timestamp: now(), id: randomUUID3(), step }
+            });
+          }
           const result_ = {
             status: "completed",
             response: responseText + fullText,
@@ -6442,6 +6668,13 @@ ${textContent}` };
               `[poncho][harness] Model "${modelName}" returned an empty response with finishReason="stop" on step ${step}.`
             );
           }
+          if (fullText.length > 0) {
+            messages.push({
+              role: "assistant",
+              content: fullText,
+              metadata: { timestamp: now(), id: randomUUID3(), step }
+            });
+          }
           responseText = fullText;
           yield pushEvent({
             type: "step:completed",
@@ -6459,7 +6692,8 @@ ${textContent}` };
             },
             duration: now() - start,
             contextTokens: latestContextTokens + toolOutputEstimateSinceModel,
-            contextWindow
+            contextWindow,
+            continuationMessages: [...messages]
           };
           yield pushEvent({ type: "run:completed", runId, result: result2 });
           return;
@@ -6555,6 +6789,27 @@ ${textContent}` };
               })
             );
           }
+        } else if (this.insideTelemetryCapture && this.hasOtlpExporter) {
+          const tracer = trace.getTracer("poncho");
+          for (const call of approvedCalls) {
+            const span = tracer.startSpan(`tool ${call.name}`, {
+              attributes: {
+                "poncho.tool.name": call.name,
+                "poncho.tool.call_id": call.id,
+                "poncho.tool.arguments": JSON.stringify(call.input)
+              }
+            });
+            toolSpans.set(call.id, {
+              end(opts) {
+                if (opts.result.isError) {
+                  span.setStatus({ code: SpanStatusCode.ERROR, message: String(opts.result.value) });
+                } else {
+                  span.setStatus({ code: SpanStatusCode.OK });
+                }
+                span.end();
+              }
+            });
+          }
         }
         const TOOL_DEADLINE_SENTINEL = /* @__PURE__ */ Symbol("tool_deadline");
         const toolDeadlineRemainingMs = softDeadlineMs > 0 ? softDeadlineMs - (now() - start) : Infinity;
@@ -6579,6 +6834,13 @@ ${textContent}` };
           batchResults = await this.dispatcher.executeBatch(approvedCalls, toolContext);
         }
         if (batchResults === TOOL_DEADLINE_SENTINEL) {
+          if (fullText.length > 0) {
+            messages.push({
+              role: "assistant",
+              content: fullText,
+              metadata: { timestamp: now(), id: randomUUID3(), step }
+            });
+          }
           const result_ = {
             status: "completed",
             response: responseText + fullText,
@@ -8066,73 +8328,6 @@ var createConversationStore = (config, options) => {
   return new InMemoryConversationStore(ttl);
 };
-// src/telemetry.ts
-var MAX_FIELD_LENGTH = 200;
-function sanitizeEventForLog(event) {
-  return JSON.stringify(event, (_key, value) => {
-    if (typeof value === "string" && value.length > MAX_FIELD_LENGTH) {
-      return `${value.slice(0, 80)}...[${value.length} chars]`;
-    }
-    return value;
-  });
-}
-var TelemetryEmitter = class {
-  config;
-  constructor(config) {
-    this.config = config;
-  }
-  async emit(event) {
-    if (this.config?.enabled === false) {
-      return;
-    }
-    if (this.config?.handler) {
-      await this.config.handler(event);
-      return;
-    }
-    if (this.config?.otlp) {
-      await this.sendOtlp(event);
-    }
-    process.stdout.write(`[event] ${event.type} ${sanitizeEventForLog(event)}
-`);
-  }
-  async sendOtlp(event) {
-    const endpoint = this.config?.otlp;
-    if (!endpoint) {
-      return;
-    }
-    try {
-      await fetch(endpoint, {
-        method: "POST",
-        headers: { "Content-Type": "application/json" },
-        body: JSON.stringify({
-          resourceLogs: [
-            {
-              scopeLogs: [
-                {
-                  logRecords: [
-                    {
-                      timeUnixNano: String(Date.now() * 1e6),
-                      severityText: "INFO",
-                      body: { stringValue: event.type },
-                      attributes: [
-                        {
-                          key: "event.payload",
-                          value: { stringValue: JSON.stringify(event) }
-                        }
-                      ]
-                    }
-                  ]
-                }
-              ]
-            }
-          ]
-        })
-      });
-    } catch {
-    }
-  }
-};
 // src/index.ts
 import { defineTool as defineTool7 } from "@poncho-ai/sdk";
 export {
@@ -8180,6 +8375,7 @@ export {
   loadSkillContext,
   loadSkillInstructions,
   loadSkillMetadata,
+  normalizeOtlp,
   normalizeScriptPolicyPath,
   parseAgentFile,
   parseAgentMarkdown,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@poncho-ai/harness",
-  "version": "0.28.3",
+  "version": "0.30.0",
   "description": "Agent execution runtime - conversation loop, tool dispatch, streaming",
   "repository": {
     "type": "git",
@@ -25,6 +25,8 @@
     "@aws-sdk/client-dynamodb": "^3.988.0",
     "@latitude-data/telemetry": "^2.0.4",
     "@opentelemetry/api": "1.9.0",
+    "@opentelemetry/exporter-trace-otlp-http": "^0.213.0",
+    "@opentelemetry/sdk-trace-node": "^2.6.0",
     "ai": "^6.0.86",
     "cheerio": "^1.2.0",
     "jiti": "^2.6.1",
@@ -32,7 +34,7 @@
     "redis": "^5.10.0",
     "yaml": "^2.4.0",
     "zod": "^3.22.0",
-    "@poncho-ai/sdk": "1.6.1"
+    "@poncho-ai/sdk": "1.6.3"
   },
   "devDependencies": {
     "@types/mustache": "^4.2.6",

package/src/config.ts CHANGED Viewed

@@ -104,7 +104,10 @@ export interface PonchoConfig extends McpConfig {
   };
   telemetry?: {
     enabled?: boolean;
-    otlp?: string;
+    otlp?: string | {
+      url: string;
+      headers?: Record<string, string>;
+    };
     latitude?: {
       apiKeyEnv?: string;
       projectIdEnv?: string;

package/src/harness.ts CHANGED Viewed

@@ -36,6 +36,10 @@ import { createSearchTools } from "./search-tools.js";
 import { createSubagentTools } from "./subagent-tools.js";
 import type { SubagentManager } from "./subagent-manager.js";
 import { LatitudeTelemetry } from "@latitude-data/telemetry";
+import { trace, context as otelContext, SpanStatusCode } from "@opentelemetry/api";
+import { NodeTracerProvider, BatchSpanProcessor } from "@opentelemetry/sdk-trace-node";
+import { OTLPTraceExporter } from "@opentelemetry/exporter-trace-otlp-http";
+import { normalizeOtlp } from "./telemetry.js";
 import {
   isSiblingScriptsPattern,
   matchesRelativeScriptPattern,
@@ -560,6 +564,9 @@ export class AgentHarness {
   private readonly activeSkillNames = new Set<string>();
   private readonly registeredMcpToolNames = new Set<string>();
   private latitudeTelemetry?: LatitudeTelemetry;
+  private otlpSpanProcessor?: BatchSpanProcessor;
+  private otlpTracerProvider?: NodeTracerProvider;
+  private hasOtlpExporter = false;
   private insideTelemetryCapture = false;
   private _browserSession?: unknown;
   private _browserMod?: {
@@ -1079,6 +1086,37 @@ export class AgentHarness {
         `[poncho][telemetry] Latitude telemetry is configured but missing: ${missing.join(", ")}. Traces will NOT be sent.`,
       );
     }
+    // Generic OTLP trace exporter — works alongside or instead of Latitude.
+    const otlpConfig = telemetryEnabled ? normalizeOtlp(config?.telemetry?.otlp) : undefined;
+    if (otlpConfig) {
+      const exporter = new OTLPTraceExporter({
+        url: otlpConfig.url,
+        headers: otlpConfig.headers,
+      });
+      const processor = new BatchSpanProcessor(exporter);
+      this.otlpSpanProcessor = processor;
+      if (this.latitudeTelemetry) {
+        // Latitude already registered a global TracerProvider (v1.x) — add our
+        // processor to it so every span flows to both destinations.
+        const globalProvider = trace.getTracerProvider();
+        const delegate = (globalProvider as unknown as { getDelegate?: () => unknown })
+          .getDelegate?.() ?? globalProvider;
+        if (typeof (delegate as Record<string, unknown>).addSpanProcessor === "function") {
+          (delegate as unknown as { addSpanProcessor(p: BatchSpanProcessor): void }).addSpanProcessor(processor);
+        }
+        console.info(`[poncho][telemetry] OTLP exporter added (piggybacking on Latitude provider) → ${otlpConfig.url}`);
+      } else {
+        const provider = new NodeTracerProvider({
+          spanProcessors: [processor],
+        });
+        provider.register();
+        this.otlpTracerProvider = provider;
+        console.info(`[poncho][telemetry] OTLP exporter active (standalone provider) → ${otlpConfig.url}`);
+      }
+      this.hasOtlpExporter = true;
+    }
   }
   private async buildBrowserStoragePersistence(
@@ -1250,6 +1288,27 @@ export class AgentHarness {
       });
       this.latitudeTelemetry = undefined;
     }
+    if (this.otlpSpanProcessor) {
+      await this.otlpSpanProcessor.shutdown().catch((err) => {
+        console.warn(
+          `[poncho][telemetry] OTLP span processor shutdown error: ${
+            err instanceof Error ? err.message : String(err)
+          }`,
+        );
+      });
+      this.otlpSpanProcessor = undefined;
+    }
+    if (this.otlpTracerProvider) {
+      await this.otlpTracerProvider.shutdown().catch((err) => {
+        console.warn(
+          `[poncho][telemetry] OTLP tracer provider shutdown error: ${
+            err instanceof Error ? err.message : String(err)
+          }`,
+        );
+      });
+      this.otlpTracerProvider = undefined;
+    }
+    this.hasOtlpExporter = false;
   }
   listTools(): ToolDefinition[] {
@@ -1257,18 +1316,20 @@ export class AgentHarness {
   }
   /**
-   * Wraps the run() generator with Latitude telemetry capture for complete trace coverage
-   * Streams events in real-time using an event queue pattern
+   * Wraps the run() generator with telemetry capture for complete trace coverage.
+   * Supports Latitude, generic OTLP, or both simultaneously.
+   * Streams events in real-time using an event queue pattern.
    */
   async *runWithTelemetry(input: RunInput): AsyncGenerator<AgentEvent> {
     const config = this.loadedConfig;
     const telemetry = this.latitudeTelemetry;
     if (telemetry) {
+      // Latitude capture path — wraps run() inside telemetry.capture().
+      // If OTLP is also configured, spans flow to both via the shared provider.
       const latProjectIdEnv2 = config?.telemetry?.latitude?.projectIdEnv ?? "LATITUDE_PROJECT_ID";
       const projectId = parseInt(process.env[latProjectIdEnv2] ?? "", 10) as number;
       const rawPath = config?.telemetry?.latitude?.path ?? this.parsedAgent?.frontmatter.name ?? 'agent';
-      // Sanitize path for Latitude's DOCUMENT_PATH_REGEXP: /^([\w-]+\/)*([\w-.])+$/
       const path = rawPath.replace(/[^\w\-./]/g, '-').replace(/-+/g, '-').replace(/^-+|-+$/g, '') || 'agent';
       const rawConversationId = input.conversationId ?? (
@@ -1276,7 +1337,6 @@ export class AgentHarness {
           ? input.parameters.__activeConversationId
           : undefined
       );
-      // Latitude expects a UUID v4 for documentLogUuid; only pass it if valid
       const UUID_RE = /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;
       const conversationUuid = rawConversationId && UUID_RE.test(rawConversationId)
         ? rawConversationId
@@ -1286,13 +1346,11 @@ export class AgentHarness {
         `[poncho][telemetry] Latitude telemetry active – projectId=${projectId}, path="${path}"${conversationUuid ? `, conversation="${conversationUuid}"` : ""}`,
       );
-      // Event queue for streaming events in real-time
       const eventQueue: AgentEvent[] = [];
       let queueResolve: ((value: void) => void) | null = null;
       let generatorDone = false;
       let generatorError: Error | null = null;
-      // Start the generator inside telemetry.capture() (runs in background)
       const capturePromise = telemetry.capture({ projectId, path, conversationUuid }, async () => {
         this.insideTelemetryCapture = true;
         try {
@@ -1316,13 +1374,11 @@ export class AgentHarness {
         }
       });
-      // Yield events from the queue as they arrive
       try {
         while (!generatorDone || eventQueue.length > 0) {
           if (eventQueue.length > 0) {
             yield eventQueue.shift()!;
           } else if (!generatorDone) {
-            // Wait for next event
             await new Promise<void>((resolve) => {
               queueResolve = resolve;
             });
@@ -1344,8 +1400,47 @@ export class AgentHarness {
           }
         }
       }
+    } else if (this.hasOtlpExporter) {
+      // Standalone OTLP path — create a root span for the agent run so all
+      // child spans (LLM calls via Vercel AI SDK, tool spans) are grouped
+      // under a single trace.
+      const tracer = trace.getTracer("poncho");
+      const agentName = this.parsedAgent?.frontmatter.name ?? "agent";
+      const rootSpan = tracer.startSpan(`agent.run ${agentName}`);
+      rootSpan.setAttribute("poncho.agent.name", agentName);
+      if (input.conversationId) {
+        rootSpan.setAttribute("poncho.conversation.id", input.conversationId);
+      }
+      // Bind the root span's context so every async step (including
+      // streamText and tool calls) sees it as the parent span.
+      const spanContext = trace.setSpan(otelContext.active(), rootSpan);
+      this.insideTelemetryCapture = true;
+      try {
+        const gen = this.run(input);
+        let next: IteratorResult<AgentEvent>;
+        do {
+          next = await otelContext.with(spanContext, () => gen.next());
+          if (!next.done) yield next.value;
+        } while (!next.done);
+        rootSpan.setStatus({ code: SpanStatusCode.OK });
+      } catch (error) {
+        rootSpan.setStatus({
+          code: SpanStatusCode.ERROR,
+          message: error instanceof Error ? error.message : String(error),
+        });
+        rootSpan.recordException(error instanceof Error ? error : new Error(String(error)));
+        throw error;
+      } finally {
+        this.insideTelemetryCapture = false;
+        rootSpan.end();
+        try {
+          await this.otlpSpanProcessor?.forceFlush();
+        } catch { /* best-effort */ }
+      }
     } else {
-      // No telemetry configured, just pass through
       yield* this.run(input);
     }
   }
@@ -1548,7 +1643,7 @@ ${boundedMainMemory.trim()}`
       if (lastMsg && lastMsg.role !== "user") {
         messages.push({
           role: "user",
-          content: "[System: Your previous turn was interrupted by a time limit. Continue from where you left off — do NOT repeat what you already said. Proceed directly with the next action or tool call.]",
+          content: "[System: Your previous turn was interrupted by a time limit. Your partial response above is already visible to the user. Continue EXACTLY from where you left off — do NOT restart, re-summarize, or repeat any content you already produced. If you were mid-sentence or mid-table, continue that sentence or table. Proceed directly with the next action or output.]",
           metadata: { timestamp: now(), id: randomUUID() },
         });
       }
@@ -1941,7 +2036,7 @@ ${boundedMainMemory.trim()}`
           abortSignal: input.abortSignal,
           ...(typeof maxTokens === "number" ? { maxTokens } : {}),
           experimental_telemetry: {
-            isEnabled: telemetryEnabled && !!this.latitudeTelemetry,
+            isEnabled: telemetryEnabled && !!(this.latitudeTelemetry || this.hasOtlpExporter),
             recordInputs: true,
             recordOutputs: true,
           },
@@ -1953,7 +2048,10 @@ ${boundedMainMemory.trim()}`
         let chunkCount = 0;
         const hasRunTimeout = timeoutMs > 0;
         const streamDeadline = hasRunTimeout ? start + timeoutMs : 0;
+        const hasSoftDeadline = softDeadlineMs > 0;
+        const INTER_CHUNK_TIMEOUT_MS = 60_000;
         const fullStreamIterator = result.fullStream[Symbol.asyncIterator]();
+        let softDeadlineFiredDuringStream = false;
         try {
           while (true) {
             if (isCancelled()) {
@@ -1977,25 +2075,36 @@ ${boundedMainMemory.trim()}`
                 return;
               }
             }
-            const remaining = hasRunTimeout ? streamDeadline - now() : Infinity;
+            if (hasSoftDeadline && chunkCount > 0 && now() - start >= softDeadlineMs) {
+              softDeadlineFiredDuringStream = true;
+              break;
+            }
+            const hardRemaining = hasRunTimeout ? streamDeadline - now() : Infinity;
+            const softRemaining = hasSoftDeadline ? Math.max(0, (start + softDeadlineMs) - now()) : Infinity;
+            const deadlineRemaining = Math.min(hardRemaining, softRemaining);
             const timeout = chunkCount === 0
-              ? Math.min(remaining, FIRST_CHUNK_TIMEOUT_MS)
-              : hasRunTimeout ? remaining : 0;
+              ? Math.min(deadlineRemaining, FIRST_CHUNK_TIMEOUT_MS)
+              : Math.min(deadlineRemaining, INTER_CHUNK_TIMEOUT_MS);
             let nextPart: IteratorResult<(typeof result.fullStream) extends AsyncIterable<infer T> ? T : never> | null;
-            if (timeout <= 0 && chunkCount > 0) {
+            if (timeout <= 0 && chunkCount > 0 && !hasSoftDeadline) {
               nextPart = await fullStreamIterator.next();
             } else {
+              const effectiveTimeout = Math.max(timeout, 1);
               let timer: ReturnType<typeof setTimeout> | undefined;
               nextPart = await Promise.race([
                 fullStreamIterator.next(),
                 new Promise<null>((resolve) => {
-                  timer = setTimeout(() => resolve(null), timeout);
+                  timer = setTimeout(() => resolve(null), effectiveTimeout);
                 }),
               ]);
               clearTimeout(timer);
             }
             if (nextPart === null) {
+              if (hasSoftDeadline && deadlineRemaining <= INTER_CHUNK_TIMEOUT_MS) {
+                softDeadlineFiredDuringStream = true;
+                break;
+              }
               const isFirstChunk = chunkCount === 0;
               console.error(
                 `[poncho][harness] Stream timeout waiting for ${isFirstChunk ? "first" : "next"} chunk: model="${modelName}", step=${step}, chunks=${chunkCount}, elapsed=${now() - start}ms`,
@@ -2030,6 +2139,31 @@ ${boundedMainMemory.trim()}`
           fullStreamIterator.return?.(undefined)?.catch?.(() => {});
         }
+        if (softDeadlineFiredDuringStream) {
+          if (fullText.length > 0) {
+            messages.push({
+              role: "assistant",
+              content: fullText,
+              metadata: { timestamp: now(), id: randomUUID(), step },
+            });
+          }
+          const result_: RunResult = {
+            status: "completed",
+            response: responseText + fullText,
+            steps: step,
+            tokens: { input: totalInputTokens, output: totalOutputTokens, cached: totalCachedTokens },
+            duration: now() - start,
+            continuation: true,
+            continuationMessages: [...messages],
+            maxSteps,
+            contextTokens: latestContextTokens + toolOutputEstimateSinceModel,
+            contextWindow,
+          };
+          console.info(`[poncho][harness] Soft deadline fired mid-stream at step ${step} (${(now() - start).toFixed(0)}ms). Checkpointing with ${fullText.length} chars of partial text.`);
+          yield pushEvent({ type: "run:completed", runId, result: result_ });
+          return;
+        }
         if (isCancelled()) {
           yield emitCancellation();
           return;
@@ -2038,6 +2172,13 @@ ${boundedMainMemory.trim()}`
       // Post-streaming soft deadline: if the model stream took long enough to
       // push past the soft deadline, checkpoint now before tool execution.
       if (softDeadlineMs > 0 && now() - start > softDeadlineMs) {
+        if (fullText.length > 0) {
+          messages.push({
+            role: "assistant",
+            content: fullText,
+            metadata: { timestamp: now(), id: randomUUID(), step },
+          });
+        }
         const result_: RunResult = {
           status: "completed",
           response: responseText + fullText,
@@ -2138,6 +2279,13 @@ ${boundedMainMemory.trim()}`
             `[poncho][harness] Model "${modelName}" returned an empty response with finishReason="stop" on step ${step}.`,
           );
         }
+        if (fullText.length > 0) {
+          messages.push({
+            role: "assistant",
+            content: fullText,
+            metadata: { timestamp: now(), id: randomUUID(), step },
+          });
+        }
         responseText = fullText;
         yield pushEvent({
           type: "step:completed",
@@ -2156,6 +2304,7 @@ ${boundedMainMemory.trim()}`
           duration: now() - start,
           contextTokens: latestContextTokens + toolOutputEstimateSinceModel,
           contextWindow,
+          continuationMessages: [...messages],
         };
         yield pushEvent({ type: "run:completed", runId, result });
         return;
@@ -2275,7 +2424,7 @@ ${boundedMainMemory.trim()}`
         return;
       }
-      // Create telemetry tool spans so tool calls appear in Latitude traces
+      // Create telemetry tool spans so tool calls appear in traces
       type ToolSpanHandle = { end: (opts: { result: { value: unknown; isError: boolean } }) => void };
       const toolSpans = new Map<string, ToolSpanHandle>();
       if (this.insideTelemetryCapture && this.latitudeTelemetry) {
@@ -2288,6 +2437,27 @@ ${boundedMainMemory.trim()}`
             }),
           );
         }
+      } else if (this.insideTelemetryCapture && this.hasOtlpExporter) {
+        const tracer = trace.getTracer("poncho");
+        for (const call of approvedCalls) {
+          const span = tracer.startSpan(`tool ${call.name}`, {
+            attributes: {
+              "poncho.tool.name": call.name,
+              "poncho.tool.call_id": call.id,
+              "poncho.tool.arguments": JSON.stringify(call.input),
+            },
+          });
+          toolSpans.set(call.id, {
+            end(opts: { result: { value: unknown; isError: boolean } }) {
+              if (opts.result.isError) {
+                span.setStatus({ code: SpanStatusCode.ERROR, message: String(opts.result.value) });
+              } else {
+                span.setStatus({ code: SpanStatusCode.OK });
+              }
+              span.end();
+            },
+          });
+        }
       }
       // Race tool execution against the soft deadline so long-running tool
@@ -2322,6 +2492,13 @@ ${boundedMainMemory.trim()}`
       }
       if ((batchResults as unknown) === TOOL_DEADLINE_SENTINEL) {
+        if (fullText.length > 0) {
+          messages.push({
+            role: "assistant",
+            content: fullText,
+            metadata: { timestamp: now(), id: randomUUID(), step },
+          });
+        }
         const result_: RunResult = {
           status: "completed",
           response: responseText + fullText,

package/src/state.ts CHANGED Viewed

@@ -71,6 +71,15 @@ export interface Conversation {
   /** Harness-internal message chain preserved across continuation runs.
    *  Cleared when a run completes without continuation. */
   _continuationMessages?: Message[];
+  /** Number of continuation pickups for the current multi-step run.
+   *  Reset when a run completes without continuation. Used to enforce
+   *  a maximum continuation count across all entry points. */
+  _continuationCount?: number;
+  /** Full structured message chain from the last harness run, including
+   *  tool-call and tool-result messages the model needs for context.
+   *  Unlike `_continuationMessages`, this is always set after a run
+   *  and does NOT signal that a continuation is pending. */
+  _harnessMessages?: Message[];
   createdAt: number;
   updatedAt: number;
 }

package/src/telemetry.ts CHANGED Viewed

@@ -11,9 +11,22 @@ function sanitizeEventForLog(event: AgentEvent): string {
   });
 }
+export interface OtlpConfig {
+  url: string;
+  headers?: Record<string, string>;
+}
+export type OtlpOption = string | OtlpConfig;
+export function normalizeOtlp(opt: OtlpOption | undefined): OtlpConfig | undefined {
+  if (!opt) return undefined;
+  if (typeof opt === "string") return opt ? { url: opt } : undefined;
+  return opt.url ? opt : undefined;
+}
 export interface TelemetryConfig {
   enabled?: boolean;
-  otlp?: string;
+  otlp?: OtlpOption;
   latitude?: {
     apiKeyEnv?: string;
     projectIdEnv?: string;
@@ -38,8 +51,9 @@ export class TelemetryEmitter {
       await this.config.handler(event);
       return;
     }
-    if (this.config?.otlp) {
-      await this.sendOtlp(event);
+    const otlp = normalizeOtlp(this.config?.otlp);
+    if (otlp) {
+      await this.sendOtlp(event, otlp);
     }
     // Latitude telemetry is handled by LatitudeTelemetry (from
     // @latitude-data/telemetry) via harness.runWithTelemetry().
@@ -48,15 +62,11 @@ export class TelemetryEmitter {
     process.stdout.write(`[event] ${event.type} ${sanitizeEventForLog(event)}\n`);
   }
-  private async sendOtlp(event: AgentEvent): Promise<void> {
-    const endpoint = this.config?.otlp;
-    if (!endpoint) {
-      return;
-    }
+  private async sendOtlp(event: AgentEvent, otlp: OtlpConfig): Promise<void> {
     try {
-      await fetch(endpoint, {
+      await fetch(otlp.url, {
         method: "POST",
-        headers: { "Content-Type": "application/json" },
+        headers: { "Content-Type": "application/json", ...otlp.headers },
         body: JSON.stringify({
           resourceLogs: [
             {