npm - @zhijiewang/openharness - Versions diffs - 2.28.0 → 2.30.0 - Mend

@zhijiewang/openharness 2.28.0 → 2.30.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

package/README.md +8 -5
package/README.zh-CN.md +8 -5
package/dist/Tool.d.ts +4 -0
package/dist/commands/info.js +28 -0
package/dist/harness/traces.d.ts +8 -1
package/dist/harness/traces.js +18 -1
package/dist/query/index.js +208 -195
package/dist/query/tools.js +5 -0
package/dist/query/types.d.ts +3 -0
package/dist/repl.js +21 -0
package/dist/services/StreamingToolExecutor.js +5 -0
package/dist/tools/AgentTool/index.js +2 -2
package/package.json +1 -1

package/README.md CHANGED Viewed

@@ -21,7 +21,7 @@ AI coding agent in your terminal. Works with any LLM -- free local models or clo
   <img src="assets/openharness_v0.11.1_4.gif" alt="OpenHarness demo" width="800" />
 </p>
-[![npm version](https://img.shields.io/npm/v/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![npm downloads](https://img.shields.io/npm/dm/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![license](https://img.shields.io/npm/l/@zhijiewang/openharness)](LICENSE) ![tests](https://img.shields.io/badge/tests-890-brightgreen) ![tools](https://img.shields.io/badge/tools-42-blue) ![Node.js 18+](https://img.shields.io/badge/node-18%2B-green) ![TypeScript](https://img.shields.io/badge/typescript-strict-blue) [![GitHub stars](https://img.shields.io/github/stars/zhijiewong/openharness)](https://github.com/zhijiewong/openharness) [![GitHub issues](https://img.shields.io/github/issues-raw/zhijiewong/openharness)](https://github.com/zhijiewong/openharness/issues) [![PRs Welcome](https://img.shields.io/badge/PRs-welcome-brightgreen)](https://github.com/zhijiewong/openharness/pulls)
+[![npm version](https://img.shields.io/npm/v/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![npm downloads](https://img.shields.io/npm/dm/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![license](https://img.shields.io/npm/l/@zhijiewang/openharness)](LICENSE) ![tests](https://img.shields.io/badge/tests-1502-brightgreen) ![tools](https://img.shields.io/badge/tools-44-blue) ![Node.js 18+](https://img.shields.io/badge/node-18%2B-green) ![TypeScript](https://img.shields.io/badge/typescript-strict-blue) [![GitHub stars](https://img.shields.io/github/stars/zhijiewong/openharness)](https://github.com/zhijiewong/openharness) [![GitHub issues](https://img.shields.io/github/issues-raw/zhijiewong/openharness)](https://github.com/zhijiewong/openharness/issues) [![PRs Welcome](https://img.shields.io/badge/PRs-welcome-brightgreen)](https://github.com/zhijiewong/openharness/pulls)
 **English** | [简体中文](README.zh-CN.md)
@@ -32,7 +32,7 @@ AI coding agent in your terminal. Works with any LLM -- free local models or clo
 - [Quick Start](#quick-start)
 - [Why OpenHarness?](#why-openharness)
 - [Terminal UI](#terminal-ui)
-- [Tools (43)](#tools-43)
+- [Tools (44)](#tools-44)
 - [Slash Commands](#slash-commands)
 - [Permission Modes](#permission-modes)
 - [Hooks](#hooks)
@@ -114,8 +114,11 @@ Scrolling is handled by the terminal's native scrollbar. Completed messages flow
 - **Syntax highlighting** — keywords, strings, comments, numbers, types (JS/TS/Python/Rust/Go and 20+ languages)
 - **Collapsible code blocks** — blocks over 8 lines auto-collapse; `Ctrl+K` to expand all
 - **Collapsible thinking** — thinking blocks collapse to a one-line summary after completion; `Ctrl+O` to expand
-- **Shimmer spinner** — animated "Thinking" indicator with color transitions (magenta → yellow at 30s → red at 60s)
-- **Tool call display** — args preview, live streaming output, result summaries (line counts, elapsed time), expand/collapse with `Tab`
+- **Shimmer spinner** — animated indicator with stage label (`Thinking`, `Running <Tool>`, `Calling <server>:<tool>`, `Running N tools`) and color transitions (magenta → yellow at 30s → red at 60s)
+- **Tool call display** — args preview, live streaming output, result summaries (line counts, elapsed time), expand/collapse with `Tab`. Tool name color-coded by category (read tools cyan, mutating tools yellow, exec tools magenta, MCP tools green)
+- **Rich tool output** — JSON files render as a colored static tree (depth-3 collapse, line truncation); markdown files render with full styling (headings, code blocks, tables) instead of plain split-on-newline. Renderer dispatches via `outputType` field stamped by FileReadTool / WebFetchTool, with a heuristic fallback for unstamped tools
+- **Nested tool calls** — when `Agent` or `ParallelAgents` spawns inner tool calls (Read, Bash, Edit), the children render indented under their spawning parent. ParallelAgents shows per-task `Task` wrapper rows so child calls group by task instead of flat under the bundled parent. Depth-3 indent limit with `… (N more level)` collapse marker
+- **Multi-line input wrap glyph** — every non-last line of a multi-line input ends with a dim `↵` continuation marker so the wrap is visually obvious
 - **Permission prompts** — bordered box with risk coloring, bold colored **Y**es/**N**o/**D**iff keys, syntax-highlighted inline diffs
 - **Status line** — model name, token count, cost, context usage bar (customizable via config)
 - **Context warning** — yellow alert when context window exceeds 75%
@@ -146,7 +149,7 @@ statusLineFormat: '{model} │ {tokens} │ {cost} │ {ctx}'
 Available variables: `{model}`, `{tokens}` (input↑ output↓), `{cost}` ($X.XXXX), `{ctx}` (context usage bar). Empty sections are automatically collapsed.
-## Tools (43)
+## Tools (44)
 | Tool | Risk | Description |
 |------|------|-------------|

package/README.zh-CN.md CHANGED Viewed

@@ -21,7 +21,7 @@
   <img src="assets/openharness_v0.11.1_4.gif" alt="OpenHarness demo" width="800" />
 </p>
-[![npm version](https://img.shields.io/npm/v/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![npm downloads](https://img.shields.io/npm/dm/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![license](https://img.shields.io/npm/l/@zhijiewang/openharness)](LICENSE) ![tests](https://img.shields.io/badge/tests-890-brightgreen) ![tools](https://img.shields.io/badge/tools-42-blue) ![Node.js 18+](https://img.shields.io/badge/node-18%2B-green) ![TypeScript](https://img.shields.io/badge/typescript-strict-blue) [![GitHub stars](https://img.shields.io/github/stars/zhijiewong/openharness)](https://github.com/zhijiewong/openharness) [![GitHub issues](https://img.shields.io/github/issues-raw/zhijiewong/openharness)](https://github.com/zhijiewong/openharness/issues) [![PRs Welcome](https://img.shields.io/badge/PRs-welcome-brightgreen)](https://github.com/zhijiewong/openharness/pulls)
+[![npm version](https://img.shields.io/npm/v/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![npm downloads](https://img.shields.io/npm/dm/@zhijiewang/openharness)](https://www.npmjs.com/package/@zhijiewang/openharness) [![license](https://img.shields.io/npm/l/@zhijiewang/openharness)](LICENSE) ![tests](https://img.shields.io/badge/tests-1502-brightgreen) ![tools](https://img.shields.io/badge/tools-44-blue) ![Node.js 18+](https://img.shields.io/badge/node-18%2B-green) ![TypeScript](https://img.shields.io/badge/typescript-strict-blue) [![GitHub stars](https://img.shields.io/github/stars/zhijiewong/openharness)](https://github.com/zhijiewong/openharness) [![GitHub issues](https://img.shields.io/github/issues-raw/zhijiewong/openharness)](https://github.com/zhijiewong/openharness/issues) [![PRs Welcome](https://img.shields.io/badge/PRs-welcome-brightgreen)](https://github.com/zhijiewong/openharness/pulls)
 [English](README.md) | **简体中文**
@@ -32,7 +32,7 @@
 - [快速开始](#快速开始)
 - [为什么选择 OpenHarness？](#为什么选择-openharness)
 - [终端界面](#终端界面)
-- [工具（43 个）](#工具43-个)
+- [工具（44 个）](#工具44-个)
 - [斜杠命令](#斜杠命令)
 - [权限模式](#权限模式)
 - [钩子](#钩子)
@@ -114,8 +114,11 @@ OpenHarness 采用受 Ink/Claude Code 默认模式启发的顺序式终端渲染
 - **语法高亮** —— 关键字、字符串、注释、数字、类型（支持 JS/TS/Python/Rust/Go 等 20+ 种语言）
 - **可折叠代码块** —— 超过 8 行的代码块会自动折叠；按 `Ctrl+K` 全部展开
 - **可折叠思考块** —— 思考块在完成后会折叠为一行摘要；按 `Ctrl+O` 展开
-- **流光加载动画** —— 带颜色过渡的 "Thinking" 指示器（30 秒后洋红 → 黄，60 秒后 → 红）
-- **工具调用显示** —— 参数预览、实时流式输出、结果摘要（行数、耗时），按 `Tab` 展开/折叠
+- **流光加载动画** —— 带阶段标签（`Thinking`、`Running <Tool>`、`Calling <server>:<tool>`、`Running N tools`）和颜色过渡的指示器（30 秒后洋红 → 黄，60 秒后 → 红）
+- **工具调用显示** —— 参数预览、实时流式输出、结果摘要（行数、耗时），按 `Tab` 展开/折叠。工具名称按类别着色（读取类青色、修改类黄色、执行类品红色、MCP 类绿色）
+- **富工具输出** —— JSON 文件以彩色静态树形渲染（深度 3 级折叠、行数截断）；Markdown 文件完整渲染样式（标题、代码块、表格），不再是普通的按行拆分。渲染器通过 `outputType` 字段分发（FileReadTool / WebFetchTool 会标注），未标注的工具走启发式回退路径
+- **嵌套工具调用** —— 当 `Agent` 或 `ParallelAgents` 派生内层工具调用（Read、Bash、Edit）时，子调用会缩进显示在派生它的父调用之下。ParallelAgents 还会显示每个任务的 `Task` 包装行，使子调用按任务分组，而不是平铺在合并的父调用之下。深度 3 级缩进上限，超过时显示 `… (N more level)` 折叠标记
+- **多行输入折行符** —— 多行输入的每一非末尾行都以暗色 `↵` 续行符结尾，使折行视觉清晰
 - **权限提示** —— 带边框的提示框，按风险级别着色，醒目的 **Y**es/**N**o/**D**iff 按键，内联 diff 带语法高亮
 - **状态栏** —— 显示模型名称、token 计数、费用、上下文占用条（可通过配置自定义）
 - **上下文告警** —— 上下文窗口超过 75% 时显示黄色警告
@@ -146,7 +149,7 @@ statusLineFormat: '{model} │ {tokens} │ {cost} │ {ctx}'
 可用变量：`{model}`、`{tokens}`（输入↑ 输出↓）、`{cost}`（$X.XXXX）、`{ctx}`（上下文占用条）。空片段会自动折叠。
-## 工具（43 个）
+## 工具（44 个）
 | 工具 | 风险 | 描述 |
 |------|------|-------------|

package/dist/Tool.d.ts CHANGED Viewed

@@ -29,6 +29,10 @@ export type ToolContext = {
     gitCommitPerTool?: boolean;
     /** Forward an inner-query tool event to the outer event stream, stamped with the parent's callId. Used by AgentTool and AgentDispatcher to surface nested tool calls. */
     emitChildEvent?: (event: ToolCallStart | ToolCallComplete | ToolCallEnd | ToolOutputDelta) => void;
+    /** Optional session tracer for OTel-style span emission around tool execution. */
+    tracer?: import("./harness/traces.js").SessionTracer;
+    /** Optional parent span ID for the current tool execution (set by query loop). */
+    parentSpanId?: string;
 };
 export type Tool<Input extends z.ZodType = z.ZodType> = {
     readonly name: string;

package/dist/commands/info.js CHANGED Viewed

@@ -11,6 +11,7 @@ import { getContextWindow } from "../harness/cost.js";
 import { getHooks, invalidateHookCache } from "../harness/hooks.js";
 import { discoverPlugins, discoverSkills } from "../harness/plugins.js";
 import { invalidateSandboxCache } from "../harness/sandbox.js";
+import { formatTrace, listTracedSessions, loadTrace } from "../harness/traces.js";
 import { invalidateVerificationCache } from "../harness/verification.js";
 import { normalizeMcpConfig } from "../mcp/config-normalize.js";
 import { connectedMcpServers, disconnectMcpClients, loadMcpTools } from "../mcp/loader.js";
@@ -47,6 +48,7 @@ export function registerInfoCommands(register, getCommandMap) {
                 "memory",
                 "doctor",
                 "hooks",
+                "traces",
                 "context",
                 "mcp",
                 "mcp-login",
@@ -358,6 +360,32 @@ export function registerInfoCommands(register, getCommandMap) {
     register("hooks", "List loaded hooks grouped by event", () => {
         return { output: formatHooksReport(getHooks()), handled: true };
     });
+    register("traces", "List sessions with persisted OTel-style traces (or show one with /traces <sessionId>)", (args) => {
+        const id = args.trim();
+        if (id) {
+            const spans = loadTrace(id);
+            if (spans.length === 0)
+                return { output: `No trace found for session ${id}.`, handled: true };
+            return { output: formatTrace(spans), handled: true };
+        }
+        const sessions = listTracedSessions();
+        if (sessions.length === 0) {
+            return {
+                output: "No persisted traces. Tracing is opt-in — start oh with OH_TRACE=1 to record spans to ~/.oh/traces/.",
+                handled: true,
+            };
+        }
+        const lines = [`${sessions.length} session(s) with traces (most recent first):`, ""];
+        for (const sid of sessions.slice(0, 20)) {
+            const spans = loadTrace(sid);
+            const totalMs = spans.reduce((sum, s) => sum + s.durationMs, 0);
+            const errors = spans.filter((s) => s.status === "error").length;
+            const errSuffix = errors > 0 ? ` ${errors} error(s)` : "";
+            lines.push(`  ${sid}  ${spans.length} spans, ${totalMs}ms total${errSuffix}`);
+        }
+        lines.push("", "Run `/traces <sessionId>` to see the full span tree.");
+        return { output: lines.join("\n"), handled: true };
+    });
     register("context", "Show context window usage breakdown", (_args, ctx) => {
         const ctxWindow = getContextWindow(ctx.model);
         let userTokens = 0, assistantTokens = 0, toolTokens = 0, systemTokens = 0;

package/dist/harness/traces.d.ts CHANGED Viewed

@@ -22,16 +22,23 @@ export type TraceEvent = {
     timestamp: number;
     attributes?: Record<string, unknown>;
 };
+export type OTLPConfig = {
+    endpoint: string;
+    headers?: Record<string, string>;
+};
 export declare class SessionTracer {
     private sessionId;
     private spans;
     private activeSpans;
     private spanCounter;
-    constructor(sessionId: string);
+    private otlp?;
+    constructor(sessionId: string, otlp?: OTLPConfig);
     /** Start a new span. Returns the span ID. */
     startSpan(name: string, attributes?: Record<string, unknown>, parentSpanId?: string): string;
     /** End a span and record it. */
     endSpan(spanId: string, status?: "ok" | "error", extraAttributes?: Record<string, unknown>): TraceSpan | null;
+    /** Fire-and-forget POST of a single span to the configured OTLP HTTP endpoint. Errors swallowed — telemetry must never crash the agent. */
+    private shipSpanOTLP;
     /** Get all completed spans */
     getSpans(): TraceSpan[];
     /** Get a summary of the trace */

package/dist/harness/traces.js CHANGED Viewed

@@ -18,8 +18,10 @@ export class SessionTracer {
     spans = [];
     activeSpans = new Map();
     spanCounter = 0;
-    constructor(sessionId) {
+    otlp;
+    constructor(sessionId, otlp) {
         this.sessionId = sessionId;
+        this.otlp = otlp;
     }
     /** Start a new span. Returns the span ID. */
     startSpan(name, attributes = {}, parentSpanId) {
@@ -50,8 +52,23 @@ export class SessionTracer {
             this.spans = this.spans.slice(-MAX_IN_MEMORY_SPANS);
         }
         this.persistSpan(span);
+        if (this.otlp)
+            this.shipSpanOTLP(span);
         return span;
     }
+    /** Fire-and-forget POST of a single span to the configured OTLP HTTP endpoint. Errors swallowed — telemetry must never crash the agent. */
+    shipSpanOTLP(span) {
+        if (!this.otlp)
+            return;
+        const payload = exportTraceOTLP(this.sessionId, [span]);
+        fetch(this.otlp.endpoint, {
+            method: "POST",
+            headers: { "Content-Type": "application/json", ...(this.otlp.headers ?? {}) },
+            body: JSON.stringify(payload),
+        }).catch(() => {
+            /* swallow — telemetry must not interfere with the agent */
+        });
+    }
     /** Get all completed spans */
     getSpans() {
         return [...this.spans];

package/dist/query/index.js CHANGED Viewed

@@ -41,6 +41,11 @@ export async function* query(userMessage, config, existingMessages = []) {
     const maxTurns = config.maxTurns ?? DEFAULT_MAX_TURNS;
     const routerCfg = readOhConfig()?.modelRouter ?? {};
     const router = new ModelRouter(routerCfg, config.model ?? "");
+    const querySpanId = config.tracer?.startSpan("query", {
+        model: config.model,
+        permissionMode: config.permissionMode,
+        toolCount: config.tools.length,
+    });
     const toolContext = {
         workingDir: config.workingDir ?? process.cwd(),
         abortSignal: config.abortSignal,
@@ -51,6 +56,8 @@ export async function* query(userMessage, config, existingMessages = []) {
         permissionMode: config.permissionMode,
         askUserQuestion: config.askUserQuestion,
         gitCommitPerTool: config.gitCommitPerTool,
+        tracer: config.tracer,
+        parentSpanId: querySpanId,
     };
     const estimateTokens = makeTokenEstimator(config.provider);
     const contextManager = new ContextManager(undefined, config.model);
@@ -99,224 +106,230 @@ export async function* query(userMessage, config, existingMessages = []) {
         consecutiveErrors: 0,
     };
     // ── Main loop ──
-    while (state.turn < maxTurns) {
-        state.turn++;
-        if (config.abortSignal?.aborted) {
-            yield { type: "turn_complete", reason: "aborted" };
-            return;
-        }
-        if (config.maxCost && config.maxCost > 0 && state.totalCost >= config.maxCost) {
-            yield { type: "error", message: `Budget exceeded: $${state.totalCost.toFixed(4)}` };
-            yield { type: "turn_complete", reason: "budget_exceeded" };
-            return;
-        }
-        // Context window management
-        // ── Context window management with circuit breaker ──
-        const contextWindow = getContextWindow(config.model);
-        const estimatedTokens = estimateMessagesTokens(state.messages, estimateTokens);
-        const MAX_COMPRESSION_FAILURES = 3;
-        if (estimatedTokens > contextWindow * 0.8 && (state.compressionFailures ?? 0) < MAX_COMPRESSION_FAILURES) {
-            const tokensBefore = estimatedTokens;
-            let strategy = "basic";
-            state.messages = compressMessages(state.messages, Math.floor(contextWindow * 0.6));
-            const afterBasic = estimateMessagesTokens(state.messages, estimateTokens);
-            if (afterBasic > contextWindow * 0.7 && state.messages.length > 4) {
-                try {
-                    state.messages = await summarizeConversation(config.provider, state.messages, config.model, Math.floor(contextWindow * 0.5));
-                    strategy = "llm-summarization";
-                    state.compressionFailures = 0; // Reset on success
+    try {
+        while (state.turn < maxTurns) {
+            state.turn++;
+            if (config.abortSignal?.aborted) {
+                yield { type: "turn_complete", reason: "aborted" };
+                return;
+            }
+            if (config.maxCost && config.maxCost > 0 && state.totalCost >= config.maxCost) {
+                yield { type: "error", message: `Budget exceeded: $${state.totalCost.toFixed(4)}` };
+                yield { type: "turn_complete", reason: "budget_exceeded" };
+                return;
+            }
+            // Context window management
+            // ── Context window management with circuit breaker ──
+            const contextWindow = getContextWindow(config.model);
+            const estimatedTokens = estimateMessagesTokens(state.messages, estimateTokens);
+            const MAX_COMPRESSION_FAILURES = 3;
+            if (estimatedTokens > contextWindow * 0.8 && (state.compressionFailures ?? 0) < MAX_COMPRESSION_FAILURES) {
+                const tokensBefore = estimatedTokens;
+                let strategy = "basic";
+                state.messages = compressMessages(state.messages, Math.floor(contextWindow * 0.6));
+                const afterBasic = estimateMessagesTokens(state.messages, estimateTokens);
+                if (afterBasic > contextWindow * 0.7 && state.messages.length > 4) {
+                    try {
+                        state.messages = await summarizeConversation(config.provider, state.messages, config.model, Math.floor(contextWindow * 0.5));
+                        strategy = "llm-summarization";
+                        state.compressionFailures = 0; // Reset on success
+                    }
+                    catch {
+                        state.compressionFailures = (state.compressionFailures ?? 0) + 1;
+                        strategy = "basic-only (llm failed)";
+                    }
                 }
-                catch {
-                    state.compressionFailures = (state.compressionFailures ?? 0) + 1;
-                    strategy = "basic-only (llm failed)";
+                const tokensAfter = estimateMessagesTokens(state.messages, estimateTokens);
+                yield {
+                    type: "error",
+                    message: `Context compressed (${strategy}): ${tokensBefore} → ${tokensAfter} tokens. Re-read any files you need.`,
+                };
+            }
+            else if (estimatedTokens > contextWindow * 0.8) {
+                yield {
+                    type: "error",
+                    message: "Context compression disabled (3 consecutive failures). Consider starting a new session.",
+                };
+            }
+            // ── Dynamic prompt: refresh memories if changed, inject warnings ──
+            try {
+                const { memoryVersion, loadActiveMemories, memoriesToPrompt } = await import("../harness/memory.js");
+                const currentVer = memoryVersion();
+                if (currentVer > lastMemoryVer) {
+                    const fresh = memoriesToPrompt(loadActiveMemories());
+                    // Replace or append memory section in fullSystemPrompt
+                    if (fullSystemPrompt.includes("# Remembered Context")) {
+                        fullSystemPrompt = fullSystemPrompt.replace(/# Remembered Context[\s\S]*?(?=\n# |$)/, fresh);
+                    }
+                    else if (fresh) {
+                        fullSystemPrompt += `\n\n${fresh}`;
+                    }
+                    lastMemoryVer = currentVer;
                 }
             }
-            const tokensAfter = estimateMessagesTokens(state.messages, estimateTokens);
-            yield {
-                type: "error",
-                message: `Context compressed (${strategy}): ${tokensBefore} → ${tokensAfter} tokens. Re-read any files you need.`,
-            };
-        }
-        else if (estimatedTokens > contextWindow * 0.8) {
-            yield {
-                type: "error",
-                message: "Context compression disabled (3 consecutive failures). Consider starting a new session.",
-            };
-        }
-        // ── Dynamic prompt: refresh memories if changed, inject warnings ──
-        try {
-            const { memoryVersion, loadActiveMemories, memoriesToPrompt } = await import("../harness/memory.js");
-            const currentVer = memoryVersion();
-            if (currentVer > lastMemoryVer) {
-                const fresh = memoriesToPrompt(loadActiveMemories());
-                // Replace or append memory section in fullSystemPrompt
-                if (fullSystemPrompt.includes("# Remembered Context")) {
-                    fullSystemPrompt = fullSystemPrompt.replace(/# Remembered Context[\s\S]*?(?=\n# |$)/, fresh);
+            catch {
+                /* memory refresh optional */
+            }
+            let turnPrompt = fullSystemPrompt;
+            if (config.maxCost && config.maxCost > 0) {
+                const pct = state.totalCost / config.maxCost;
+                if (pct >= 0.9) {
+                    turnPrompt += `\n\n⚠️ BUDGET CRITICAL: Only $${(config.maxCost - state.totalCost).toFixed(4)} remaining. Provide final response NOW.`;
                 }
-                else if (fresh) {
-                    fullSystemPrompt += `\n\n${fresh}`;
+                else if (pct >= 0.7) {
+                    turnPrompt += `\n\n⚠️ BUDGET WARNING: ${Math.round((1 - pct) * 100)}% budget remaining. Start consolidating.`;
                 }
-                lastMemoryVer = currentVer;
             }
-        }
-        catch {
-            /* memory refresh optional */
-        }
-        let turnPrompt = fullSystemPrompt;
-        if (config.maxCost && config.maxCost > 0) {
-            const pct = state.totalCost / config.maxCost;
-            if (pct >= 0.9) {
-                turnPrompt += `\n\n⚠️ BUDGET CRITICAL: Only $${(config.maxCost - state.totalCost).toFixed(4)} remaining. Provide final response NOW.`;
+            if (state.turn >= maxTurns * 0.9 && maxTurns > 1) {
+                turnPrompt += `\n\n⚠️ TURN LIMIT: ${maxTurns - state.turn} turn(s) remaining. Wrap up.`;
             }
-            else if (pct >= 0.7) {
-                turnPrompt += `\n\n⚠️ BUDGET WARNING: ${Math.round((1 - pct) * 100)}% budget remaining. Start consolidating.`;
-            }
-        }
-        if (state.turn >= maxTurns * 0.9 && maxTurns > 1) {
-            turnPrompt += `\n\n⚠️ TURN LIMIT: ${maxTurns - state.turn} turn(s) remaining. Wrap up.`;
-        }
-        // ── LLM call with streaming ──
-        let assistantContent = "";
-        const toolCalls = [];
-        let streamError = null;
-        const streamingExecutor = new StreamingToolExecutor(config.tools, toolContext, config.permissionMode, config.askUser, config.abortSignal);
-        try {
-            const ctxUsage = estimateRouteContextUsage(state.messages, config.provider, config.model ?? "");
-            const selection = router.select({
-                turn: state.turn,
-                hadToolCalls: state.lastTurnHadTools ?? false,
-                toolCallCount: state.lastTurnToolCount ?? 0,
-                contextUsage: ctxUsage,
-                isFinalResponse: (state.lastTurnHadTools === false || state.lastTurnHadTools === undefined) && state.turn > 1,
-                role: config.role,
-            });
-            for await (const event of config.provider.stream(state.messages, turnPrompt, apiTools, selection.model)) {
-                if (config.abortSignal?.aborted)
-                    break;
-                switch (event.type) {
-                    case "text_delta":
-                        assistantContent += event.content;
-                        yield event;
-                        break;
-                    case "tool_call_start":
-                        toolCalls.push({ id: event.callId, toolName: event.toolName, arguments: {} });
-                        yield event;
+            // ── LLM call with streaming ──
+            let assistantContent = "";
+            const toolCalls = [];
+            let streamError = null;
+            const streamingExecutor = new StreamingToolExecutor(config.tools, toolContext, config.permissionMode, config.askUser, config.abortSignal);
+            try {
+                const ctxUsage = estimateRouteContextUsage(state.messages, config.provider, config.model ?? "");
+                const selection = router.select({
+                    turn: state.turn,
+                    hadToolCalls: state.lastTurnHadTools ?? false,
+                    toolCallCount: state.lastTurnToolCount ?? 0,
+                    contextUsage: ctxUsage,
+                    isFinalResponse: (state.lastTurnHadTools === false || state.lastTurnHadTools === undefined) && state.turn > 1,
+                    role: config.role,
+                });
+                for await (const event of config.provider.stream(state.messages, turnPrompt, apiTools, selection.model)) {
+                    if (config.abortSignal?.aborted)
                         break;
-                    case "tool_call_complete": {
-                        const tc = toolCalls.find((t) => t.id === event.callId);
-                        if (tc) {
-                            const idx = toolCalls.indexOf(tc);
-                            toolCalls[idx] = { ...tc, arguments: event.arguments };
+                    switch (event.type) {
+                        case "text_delta":
+                            assistantContent += event.content;
+                            yield event;
+                            break;
+                        case "tool_call_start":
+                            toolCalls.push({ id: event.callId, toolName: event.toolName, arguments: {} });
+                            yield event;
+                            break;
+                        case "tool_call_complete": {
+                            const tc = toolCalls.find((t) => t.id === event.callId);
+                            if (tc) {
+                                const idx = toolCalls.indexOf(tc);
+                                toolCalls[idx] = { ...tc, arguments: event.arguments };
+                            }
+                            if (streamingExecutor) {
+                                streamingExecutor.addTool({ id: event.callId, toolName: event.toolName, arguments: event.arguments });
+                            }
+                            break;
                         }
-                        if (streamingExecutor) {
-                            streamingExecutor.addTool({ id: event.callId, toolName: event.toolName, arguments: event.arguments });
-                        }
-                        break;
+                        case "cost_update":
+                            state.totalCost += event.cost;
+                            state.totalInputTokens += event.inputTokens;
+                            state.totalOutputTokens += event.outputTokens;
+                            yield event;
+                            break;
+                        case "error":
+                            yield event;
+                            break;
                     }
-                    case "cost_update":
-                        state.totalCost += event.cost;
-                        state.totalInputTokens += event.inputTokens;
-                        state.totalOutputTokens += event.outputTokens;
-                        yield event;
-                        break;
-                    case "error":
-                        yield event;
-                        break;
                 }
+                state.consecutiveErrors = 0;
             }
-            state.consecutiveErrors = 0;
-        }
-        catch (err) {
-            streamError = err instanceof Error ? err : new Error(String(err));
-            state.consecutiveErrors++;
-            // Circuit breaker
-            if (state.consecutiveErrors >= MAX_CONSECUTIVE_ERRORS) {
-                yield {
-                    type: "error",
-                    message: `Too many consecutive errors (${state.consecutiveErrors}): ${streamError.message}`,
-                };
+            catch (err) {
+                streamError = err instanceof Error ? err : new Error(String(err));
+                state.consecutiveErrors++;
+                // Circuit breaker
+                if (state.consecutiveErrors >= MAX_CONSECUTIVE_ERRORS) {
+                    yield {
+                        type: "error",
+                        message: `Too many consecutive errors (${state.consecutiveErrors}): ${streamError.message}`,
+                    };
+                    yield { type: "turn_complete", reason: "error" };
+                    return;
+                }
+                // Error recovery cascade
+                if (isRateLimitError(streamError) || isOverloadError(streamError)) {
+                    const attempt = state.consecutiveErrors;
+                    const isOverload = isOverloadError(streamError);
+                    if (attempt <= MAX_RATE_LIMIT_RETRIES) {
+                        const baseRetry = 2 ** attempt * (isOverload ? 2 : 1);
+                        const retryIn = baseRetry * (0.5 + Math.random());
+                        yield { type: "rate_limited", retryIn: Math.round(retryIn), attempt };
+                        await new Promise((r) => setTimeout(r, retryIn * 1000));
+                        continue;
+                    }
+                    yield {
+                        type: "error",
+                        message: `${isOverload ? "Server overloaded" : "Rate limit exceeded"} after ${MAX_RATE_LIMIT_RETRIES} retries.`,
+                    };
+                    yield { type: "turn_complete", reason: "error" };
+                    return;
+                }
+                if (isPromptTooLongError(streamError)) {
+                    state.promptTooLongRetries = (state.promptTooLongRetries ?? 0) + 1;
+                    if (state.promptTooLongRetries > 2) {
+                        yield { type: "error", message: "Context still too long after 2 compression attempts." };
+                        yield { type: "turn_complete", reason: "error" };
+                        return;
+                    }
+                    state.messages = compressMessages(state.messages, Math.floor(contextWindow * 0.5));
+                    state.transition = "retry_prompt_too_long";
+                    yield { type: "error", message: "Context too long, compressing history..." };
+                    continue;
+                }
+                if (isNetworkError(streamError)) {
+                    state.transition = "retry_network";
+                    const delay = 1000 * 2 ** (state.consecutiveErrors - 1);
+                    yield { type: "error", message: `Network error, retrying in ${delay / 1000}s...` };
+                    await new Promise((r) => setTimeout(r, delay));
+                    continue;
+                }
+                yield { type: "error", message: streamError.message };
                 yield { type: "turn_complete", reason: "error" };
                 return;
             }
-            // Error recovery cascade
-            if (isRateLimitError(streamError) || isOverloadError(streamError)) {
-                const attempt = state.consecutiveErrors;
-                const isOverload = isOverloadError(streamError);
-                if (attempt <= MAX_RATE_LIMIT_RETRIES) {
-                    const baseRetry = 2 ** attempt * (isOverload ? 2 : 1);
-                    const retryIn = baseRetry * (0.5 + Math.random());
-                    yield { type: "rate_limited", retryIn: Math.round(retryIn), attempt };
-                    await new Promise((r) => setTimeout(r, retryIn * 1000));
-                    continue;
-                }
+            if (config.abortSignal?.aborted) {
+                yield { type: "turn_complete", reason: "aborted" };
+                return;
+            }
+            if (assistantContent === "" && toolCalls.length === 0) {
                 yield {
                     type: "error",
-                    message: `${isOverload ? "Server overloaded" : "Rate limit exceeded"} after ${MAX_RATE_LIMIT_RETRIES} retries.`,
+                    message: "No response received. Check that your model server is running and the model name is correct.",
                 };
-                yield { type: "turn_complete", reason: "error" };
                 return;
             }
-            if (isPromptTooLongError(streamError)) {
-                state.promptTooLongRetries = (state.promptTooLongRetries ?? 0) + 1;
-                if (state.promptTooLongRetries > 2) {
-                    yield { type: "error", message: "Context still too long after 2 compression attempts." };
-                    yield { type: "turn_complete", reason: "error" };
-                    return;
-                }
-                state.messages = compressMessages(state.messages, Math.floor(contextWindow * 0.5));
-                state.transition = "retry_prompt_too_long";
-                yield { type: "error", message: "Context too long, compressing history..." };
-                continue;
+            state.messages.push(createAssistantMessage(assistantContent, toolCalls.length > 0 ? toolCalls : undefined));
+            if (toolCalls.length === 0) {
+                yield { type: "turn_complete", reason: "completed" };
+                return;
             }
-            if (isNetworkError(streamError)) {
-                state.transition = "retry_network";
-                const delay = 1000 * 2 ** (state.consecutiveErrors - 1);
-                yield { type: "error", message: `Network error, retrying in ${delay / 1000}s...` };
-                await new Promise((r) => setTimeout(r, delay));
-                continue;
+            // Collect streaming tool results
+            await streamingExecutor.waitForAll();
+            const completedResults = [...streamingExecutor.getCompletedResults()];
+            const executedIds = new Set(completedResults.map((r) => r.toolCall.id));
+            for (const { callId, chunk } of streamingExecutor.outputChunks) {
+                yield { type: "tool_output_delta", callId, chunk };
             }
-            yield { type: "error", message: streamError.message };
-            yield { type: "turn_complete", reason: "error" };
-            return;
-        }
-        if (config.abortSignal?.aborted) {
-            yield { type: "turn_complete", reason: "aborted" };
-            return;
-        }
-        if (assistantContent === "" && toolCalls.length === 0) {
-            yield {
-                type: "error",
-                message: "No response received. Check that your model server is running and the model name is correct.",
-            };
-            return;
-        }
-        state.messages.push(createAssistantMessage(assistantContent, toolCalls.length > 0 ? toolCalls : undefined));
-        if (toolCalls.length === 0) {
-            yield { type: "turn_complete", reason: "completed" };
-            return;
-        }
-        // Collect streaming tool results
-        await streamingExecutor.waitForAll();
-        const completedResults = [...streamingExecutor.getCompletedResults()];
-        const executedIds = new Set(completedResults.map((r) => r.toolCall.id));
-        for (const { callId, chunk } of streamingExecutor.outputChunks) {
-            yield { type: "tool_output_delta", callId, chunk };
-        }
-        for (const { toolCall: tc, result } of completedResults) {
-            yield { type: "tool_call_end", callId: tc.id, output: result.output, isError: result.isError };
-            // Apply context budget to tool output
-            const budgetedOutput = contextManager.enforceToolBudget(tc.toolName, result.output);
-            state.messages.push(createToolResultMessage({ callId: tc.id, output: budgetedOutput, isError: result.isError }));
-        }
-        // Execute remaining tools not started during streaming
-        const remaining = toolCalls.filter((tc) => !executedIds.has(tc.id));
-        if (remaining.length > 0) {
-            yield* executeToolCalls(remaining, config.tools, toolContext, config.permissionMode, config.askUser, state, config.permissionPromptTool);
+            for (const { toolCall: tc, result } of completedResults) {
+                yield { type: "tool_call_end", callId: tc.id, output: result.output, isError: result.isError };
+                // Apply context budget to tool output
+                const budgetedOutput = contextManager.enforceToolBudget(tc.toolName, result.output);
+                state.messages.push(createToolResultMessage({ callId: tc.id, output: budgetedOutput, isError: result.isError }));
+            }
+            // Execute remaining tools not started during streaming
+            const remaining = toolCalls.filter((tc) => !executedIds.has(tc.id));
+            if (remaining.length > 0) {
+                yield* executeToolCalls(remaining, config.tools, toolContext, config.permissionMode, config.askUser, state, config.permissionPromptTool);
+            }
+            state.lastTurnHadTools = toolCalls.length > 0;
+            state.lastTurnToolCount = toolCalls.length;
+            state.transition = "next_turn";
         }
-        state.lastTurnHadTools = toolCalls.length > 0;
-        state.lastTurnToolCount = toolCalls.length;
-        state.transition = "next_turn";
+        yield { type: "turn_complete", reason: "max_turns" };
+    }
+    finally {
+        if (querySpanId)
+            config.tracer?.endSpan(querySpanId, "ok", { turns: state.turn });
     }
-    yield { type: "turn_complete", reason: "max_turns" };
 }
 //# sourceMappingURL=index.js.map

package/dist/query/tools.js CHANGED Viewed

@@ -216,6 +216,7 @@ export async function executeSingleTool(toolCall, tools, context, permissionMode
         return { output: "Blocked by preToolUse hook.", isError: true };
     }
     // Execute with timeout and result budgeting
+    const toolSpanId = context.tracer?.startSpan(`tool:${tool.name}`, { riskLevel: tool.riskLevel }, context.parentSpanId);
     try {
         const toolAbort = AbortSignal.timeout(TOOL_TIMEOUT_MS);
         const contextWithTimeout = { ...context, abortSignal: context.abortSignal ?? toolAbort };
@@ -225,6 +226,8 @@ export async function executeSingleTool(toolCall, tools, context, permissionMode
                 toolAbort.addEventListener("abort", () => reject(new Error(`Tool '${tool.name}' timed out after ${TOOL_TIMEOUT_MS / 1000}s`)));
             }),
         ]);
+        if (toolSpanId)
+            context.tracer?.endSpan(toolSpanId, result.isError ? "error" : "ok");
         // Hook: postToolUse / postToolUseFailure (mutually exclusive — strict CC parity)
         if (result.isError) {
             emitHook("postToolUseFailure", {
@@ -300,6 +303,8 @@ export async function executeSingleTool(toolCall, tools, context, permissionMode
     catch (err) {
         const errMsg = err instanceof Error ? err.message : String(err);
         const errName = err instanceof Error ? err.name : "ExecutionError";
+        if (toolSpanId)
+            context.tracer?.endSpan(toolSpanId, "error", { error: errMsg });
         emitHook("postToolUseFailure", {
             toolName: tool.name,
             toolArgs: JSON.stringify(toolCall.arguments).slice(0, 1000),

package/dist/query/types.d.ts CHANGED Viewed

@@ -1,6 +1,7 @@
 /**
  * Shared types for the query loop sub-modules.
  */
+import type { SessionTracer } from "../harness/traces.js";
 import type { Provider } from "../providers/base.js";
 import type { Tools } from "../Tool.js";
 import type { Message } from "../types/message.js";
@@ -32,6 +33,8 @@ export type QueryConfig = {
      * the tool is missing, throws, or returns malformed JSON.
      */
     permissionPromptTool?: string;
+    /** Optional session tracer. When set, query() emits `query` and `tool:<Name>` spans. */
+    tracer?: SessionTracer;
 };
 export type TransitionReason = "next_turn" | "retry_network" | "retry_prompt_too_long" | "retry_max_output_tokens";
 export type QueryLoopState = {

package/dist/repl.js CHANGED Viewed

@@ -64,6 +64,26 @@ export async function startREPL(config) {
     // Initialize checkpoints for file rewind
     const { initCheckpoints } = await import("./harness/checkpoints.js");
     initCheckpoints(session.id);
+    // Optional session-wide tracer. Opt-in via OH_TRACE=1 env var.
+    // Persists OTel-style spans to ~/.oh/traces/<sessionId>.jsonl.
+    // When OH_OTLP_ENDPOINT is also set, ships each ended span via fire-and-forget
+    // HTTP POST to the configured collector (Jaeger, Honeycomb, Grafana Tempo, etc.).
+    // OH_OTLP_HEADERS is a JSON-encoded headers object, e.g. '{"Authorization":"Bearer ..."}'.
+    let tracer;
+    if (process.env.OH_TRACE === "1") {
+        const { SessionTracer } = await import("./harness/traces.js");
+        const otlpEndpoint = process.env.OH_OTLP_ENDPOINT;
+        let otlpHeaders;
+        if (process.env.OH_OTLP_HEADERS) {
+            try {
+                otlpHeaders = JSON.parse(process.env.OH_OTLP_HEADERS);
+            }
+            catch {
+                /* malformed JSON in env — skip headers, ship without auth */
+            }
+        }
+        tracer = new SessionTracer(session.id, otlpEndpoint ? { endpoint: otlpEndpoint, headers: otlpHeaders } : undefined);
+    }
     // Start background cron executor
     const { CronExecutor } = await import("./services/CronExecutor.js");
     const cronExecutor = new CronExecutor(config.provider, config.tools, config.systemPrompt, config.permissionMode, config.model);
@@ -900,6 +920,7 @@ export async function startREPL(config) {
             askUserQuestion,
             model: currentModel || undefined,
             abortSignal: abortController.signal,
+            tracer,
         };
         try {
             for await (const event of query(prompt, queryConfig, messages)) {

package/dist/services/StreamingToolExecutor.js CHANGED Viewed

@@ -94,8 +94,11 @@ export class StreamingToolExecutor {
                 this.outputChunks.push({ callId: id, chunk });
             },
         };
+        const toolSpanId = callContext.tracer?.startSpan(`tool:${tool.name}`, { riskLevel: tool.riskLevel }, callContext.parentSpanId);
         try {
             tracked.result = await tool.call(parsed.data, callContext);
+            if (toolSpanId)
+                callContext.tracer?.endSpan(toolSpanId, tracked.result.isError ? "error" : "ok");
             // Verification loop: auto-run lint/typecheck after file-modifying tools
             if (tracked.result && !tracked.result.isError && ["Edit", "Write", "MultiEdit"].includes(tool.name)) {
                 try {
@@ -132,6 +135,8 @@ export class StreamingToolExecutor {
                 output: `Error: ${err instanceof Error ? err.message : String(err)}`,
                 isError: true,
             };
+            if (toolSpanId)
+                callContext.tracer?.endSpan(toolSpanId, "error", { error: tracked.result.output });
         }
         tracked.status = "completed";
         this.processQueue(); // Process next queued tools

package/dist/tools/AgentTool/index.js CHANGED Viewed

@@ -165,10 +165,10 @@ export const AgentTool = {
                     }
                     else if (event.type === "tool_output_delta") {
                         outputChunks.push(event.chunk);
-                        if (context.onOutputChunk && context.callId) {
+                        const forwarded = forwardInnerEvent(event, context);
+                        if (!forwarded && context.onOutputChunk && context.callId) {
                             context.onOutputChunk(context.callId, event.chunk);
                         }
-                        forwardInnerEvent(event, context);
                     }
                     else if (event.type === "tool_call_start" ||
                         event.type === "tool_call_complete" ||

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@zhijiewang/openharness",
-  "version": "2.28.0",
+  "version": "2.30.0",
   "description": "Open-source terminal coding agent. Works with any LLM.",
   "type": "module",
   "bin": {