npm - @semalt-ai/code - Versions diffs - 1.8.5 → 1.19.0 - Mend

@semalt-ai/code 1.8.5 → 1.19.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (146) hide show

package/.claude/settings.local.json +6 -1
package/.github/workflows/ci.yml +69 -0
package/CLAUDE.md +1584 -26
package/README.md +147 -3
package/examples/embed.js +74 -0
package/index.js +251 -10
package/lib/agent.js +711 -104
package/lib/api.js +213 -49
package/lib/args.js +74 -2
package/lib/audit.js +23 -1
package/lib/background.js +584 -0
package/lib/checkpoints.js +757 -0
package/lib/commands/auth.js +94 -0
package/lib/commands/chat-session.js +306 -0
package/lib/commands/chat-slash.js +399 -0
package/lib/commands/chat-turn.js +446 -0
package/lib/commands/chat.js +403 -0
package/lib/commands/custom.js +157 -0
package/lib/commands/history-utils.js +66 -0
package/lib/commands/index.js +268 -0
package/lib/commands/mcp.js +113 -0
package/lib/commands/oneshot.js +193 -0
package/lib/commands/registry.js +269 -0
package/lib/commands/tasks.js +89 -0
package/lib/compact.js +87 -0
package/lib/config.js +333 -11
package/lib/constants.js +372 -3
package/lib/deny.js +199 -0
package/lib/doctor.js +160 -0
package/lib/headless.js +167 -0
package/lib/hooks.js +286 -0
package/lib/images.js +264 -0
package/lib/internals.js +49 -0
package/lib/mcp/boundary.js +131 -0
package/lib/mcp/client.js +270 -0
package/lib/mcp/oauth.js +134 -0
package/lib/memory.js +209 -0
package/lib/metrics.js +37 -2
package/lib/payload.js +54 -0
package/lib/permission-rules.js +401 -0
package/lib/permissions.js +100 -10
package/lib/pricing.js +67 -0
package/lib/proc.js +62 -0
package/lib/prompts.js +84 -5
package/lib/sandbox.js +568 -0
package/lib/sdk.js +328 -0
package/lib/secrets.js +211 -0
package/lib/skills.js +223 -0
package/lib/subagents.js +516 -0
package/lib/tool_registry.js +2558 -0
package/lib/tool_specs.js +222 -2
package/lib/tools.js +272 -1020
package/lib/ui/format.js +22 -1
package/lib/ui/input-field.js +16 -7
package/lib/ui/status-bar.js +79 -11
package/lib/ui/theme.js +1 -0
package/lib/ui/web-activity.js +218 -0
package/lib/verify.js +229 -0
package/lib/web-extract.js +213 -0
package/lib/web-summarize.js +68 -0
package/package.json +19 -4
package/scripts/lint.js +57 -0
package/test/agent-loop.test.js +389 -0
package/test/background.test.js +414 -0
package/test/chat.test.js +114 -0
package/test/checkpoints-agent.test.js +181 -0
package/test/checkpoints.test.js +650 -0
package/test/command-registry.test.js +160 -0
package/test/compact.test.js +116 -0
package/test/completion-lazy.test.js +52 -0
package/test/config-merge.test.js +324 -0
package/test/config-quarantine.test.js +128 -0
package/test/config-write-guard-allow-anywhere.test.js +56 -0
package/test/config-write-guard-skip.test.js +46 -0
package/test/config-write-guard.test.js +153 -0
package/test/context-split.test.js +215 -0
package/test/cost-doctor.test.js +142 -0
package/test/custom-commands-chat.test.js +106 -0
package/test/custom-commands.test.js +230 -0
package/test/deny-windows.test.js +120 -0
package/test/deny.test.js +83 -0
package/test/download-allow-anywhere.test.js +66 -0
package/test/download-confine.test.js +153 -0
package/test/executors.test.js +362 -0
package/test/extract-tool-calls.test.js +315 -0
package/test/fetch-url-validation.test.js +219 -0
package/test/fixtures/tool-calls.js +57 -0
package/test/fixtures/web-page.js +91 -0
package/test/git-tools.test.js +384 -0
package/test/grep-glob-serialize.test.js +242 -0
package/test/grep-glob.test.js +268 -0
package/test/harness/README.md +57 -0
package/test/harness/chat-harness.js +142 -0
package/test/harness/memwarn-headless-child.js +65 -0
package/test/harness/mock-llm.js +120 -0
package/test/harness/mock-mcp-server.js +142 -0
package/test/harness/sse-server.js +69 -0
package/test/headless.test.js +203 -0
package/test/history-utils.test.js +88 -0
package/test/hooks-agent.test.js +238 -0
package/test/hooks-verify-sandbox.test.js +232 -0
package/test/hooks.test.js +216 -0
package/test/http-get-user-agent.test.js +142 -0
package/test/images-api.test.js +208 -0
package/test/images.test.js +238 -0
package/test/max-iterations.test.js +216 -0
package/test/mcp-boundary.test.js +57 -0
package/test/mcp-client.test.js +267 -0
package/test/mcp-oauth.test.js +86 -0
package/test/memory-truncation-warning.test.js +222 -0
package/test/memory.test.js +198 -0
package/test/native-dispatch.test.js +356 -0
package/test/output-chokepoint.test.js +188 -0
package/test/path-guards.test.js +134 -0
package/test/payload.test.js +99 -0
package/test/permission-rules-agent.test.js +210 -0
package/test/permission-rules.test.js +297 -0
package/test/permissions.test.js +163 -0
package/test/plan-mode.test.js +167 -0
package/test/read-paginate.test.js +275 -0
package/test/readonly-tools.test.js +177 -0
package/test/result-cap.test.js +233 -0
package/test/sandbox-agent.test.js +147 -0
package/test/sandbox-integration.test.js +216 -0
package/test/sandbox.test.js +408 -0
package/test/sdk.test.js +234 -0
package/test/shell-output-cap.test.js +181 -0
package/test/skills-chat.test.js +110 -0
package/test/skills.test.js +295 -0
package/test/smoke.test.js +68 -0
package/test/status-bar-pause.test.js +164 -0
package/test/stream-parser.test.js +147 -0
package/test/subagents-agent.test.js +178 -0
package/test/subagents.test.js +222 -0
package/test/tool-registry.test.js +85 -0
package/test/trim-budget.test.js +101 -0
package/test/verify-agent.test.js +317 -0
package/test/verify.test.js +141 -0
package/test/web-activity-ordering.test.js +194 -0
package/test/web-activity.test.js +207 -0
package/test/web-data-extraction-guidance.test.js +71 -0
package/test/web-extract.test.js +185 -0
package/test/web-fetch-agent.test.js +291 -0
package/test/web-fetch-mode.test.js +193 -0
package/test/web-search.test.js +380 -0
package/lib/commands.js +0 -1438

package/test/checkpoints-agent.test.js ADDED Viewed

@@ -0,0 +1,181 @@
+'use strict';
+// Integration tests for checkpoints (Task 4.3) driving the REAL executor +
+// runAgentLoop (and a REAL subagent loop) against the mock-LLM harness. Covers:
+//   * a write through the real loop is checkpointed post-gate/pre-mutation, with
+//     turn linkage, and is rewindable;
+//   * a DENIED tool call produces NO checkpoint;
+//   * a SUBAGENT's mutation is checkpointed into the PARENT session and is
+//     rewindable (subagents reuse the parent's agentExecFile).
+const { test, before, after, afterEach } = require('node:test');
+const assert = require('node:assert');
+const fs = require('fs');
+const os = require('os');
+const path = require('path');
+const ui = require('../lib/ui');
+const { createApiClient } = require('../lib/api');
+const { createToolExecutor, extractToolCalls } = require('../lib/tools');
+const { createPermissionManager } = require('../lib/permissions');
+const { createAgentRunner } = require('../lib/agent');
+const { createCheckpointStore } = require('../lib/checkpoints');
+const toolRegistry = require('../lib/tool_registry');
+const { createSubagentManager, buildSpawnAgentEntry } = require('../lib/subagents');
+const { startMockLLM } = require('./harness/mock-llm');
+let prevKey;
+before(() => { prevKey = process.env.SEMALT_API_KEY; process.env.SEMALT_API_KEY = 'test-key'; });
+after(() => {
+  if (prevKey === undefined) delete process.env.SEMALT_API_KEY;
+  else process.env.SEMALT_API_KEY = prevKey;
+});
+afterEach(() => { toolRegistry.clearDynamicTools(); });
+function tmpdir(tag = 'work') { return fs.mkdtempSync(path.join(os.tmpdir(), `semalt-cpa-${tag}-`)); }
+// Build a full stack (api + permissions + executor wired with a real checkpoint
+// store + agent runner). Optionally wires a subagent manager sharing the SAME
+// executor, so a child's mutations flow through the same checkpoint store.
+function buildStack(base, { skipPermissions = false, withSubagents = false } = {}) {
+  const config = {
+    api_base: base, api_key: 'test-key', default_model: 'test-model',
+    temperature: 0.5, request_timeout_ms: 5000, stream: true, models: [],
+    checkpoints: { enabled: true },
+  };
+  const getConfig = () => config;
+  const api = createApiClient({ getConfig, saveConfig: (c) => Object.assign(config, c), ui });
+  const pm = createPermissionManager(ui, { skipPermissions });
+  pm.setUICallbacks({ onAddMessage: () => {}, onShowModal: () => {}, onCloseModal: () => {}, onCaptureNavigation: () => () => {} });
+  const root = tmpdir('cproot');
+  const checkpointStore = createCheckpointStore({
+    getConfig, sessionId: 'agent-sess', rootDir: root, audit: { logCheckpoint: () => {} },
+  });
+  const { agentExecShell, agentExecFile, describePermission } = createToolExecutor(pm, ui, getConfig, { checkpointStore });
+  const runner = createAgentRunner({
+    chatStream: api.chatStream, extractToolCalls, agentExecShell, agentExecFile,
+    describePermission, permissionManager: pm, ui, getConfig, checkpoints: checkpointStore,
+  });
+  let manager = null;
+  if (withSubagents) {
+    manager = createSubagentManager({
+      chatStream: api.chatStream, extractToolCalls, agentExecShell, agentExecFile,
+      describePermission, permissionManager: pm, ui, getConfig, agentDefs: [],
+    });
+    toolRegistry.registerDynamicTool(buildSpawnAgentEntry(manager));
+  }
+  return { runner, manager, checkpointStore, root, config };
+}
+// ---------------------------------------------------------------------------
+// 1. A write through the real loop is checkpointed (post-gate) and rewindable
+// ---------------------------------------------------------------------------
+test('a top-level write is checkpointed with turn linkage and is rewindable', async () => {
+  const dir = tmpdir();
+  const file = path.join(dir, 'note.txt');
+  fs.writeFileSync(file, 'ORIGINAL');
+  // isPathSafe confines writes to the CWD — point it at the work dir.
+  const cwd0 = process.cwd();
+  process.chdir(dir);
+  const mock = await startMockLLM();
+  mock.replyWith(`<write_file path="${file}">REWRITTEN</write_file>`); // iter 0: the mutation
+  mock.replyWith('Done.');                                            // iter 1: final
+  try {
+    const { runner, checkpointStore } = buildStack(mock.base, { skipPermissions: true });
+    const messages = [{ role: 'user', content: 'rewrite the note' }];
+    await runner.runAgentLoop(messages, 'test-model', 5, null, { callbacks: { onError: () => {} } });
+    assert.strictEqual(fs.readFileSync(file, 'utf8'), 'REWRITTEN', 'the write happened');
+    const items = checkpointStore.list();
+    assert.strictEqual(items.length, 1, 'one checkpoint captured for the write');
+    const rec = checkpointStore._loadRecord(items[0].seq);
+    assert.strictEqual(rec.action, 'write');
+    assert.strictEqual(rec.targets[0].path, file);
+    // prior state was captured BEFORE the mutation
+    assert.strictEqual(Buffer.from(rec.targets[0].priorContentB64, 'base64').toString('utf8'), 'ORIGINAL');
+    // turn linkage recorded (forward-compat for conversation-rewind, Task 4.3b)
+    assert.strictEqual(rec.turn.turnId, 'turn-1');
+    assert.strictEqual(typeof rec.turn.messageCountAtStart, 'number');
+    // and it actually rewinds
+    const res = checkpointStore.rewind('last');
+    assert.ok(res.ok);
+    assert.strictEqual(fs.readFileSync(file, 'utf8'), 'ORIGINAL', 'rewind restored prior content');
+  } finally {
+    await mock.close();
+    process.chdir(cwd0);
+  }
+});
+// ---------------------------------------------------------------------------
+// 2. A denied tool call produces NO checkpoint
+// ---------------------------------------------------------------------------
+test('a denied write (non-TTY, no skip) is NOT checkpointed', async () => {
+  const dir = tmpdir();
+  const file = path.join(dir, 'blocked.txt');
+  const mock = await startMockLLM();
+  mock.replyWith(`<write_file path="${file}">SHOULD NOT WRITE</write_file>`); // denied at the gate
+  mock.replyWith('ok');
+  try {
+    // skipPermissions:false in a non-TTY env → the gate REFUSES the write, so
+    // the executor never runs and nothing is checkpointed.
+    const { runner, checkpointStore } = buildStack(mock.base, { skipPermissions: false });
+    const messages = [{ role: 'user', content: 'try to write' }];
+    await runner.runAgentLoop(messages, 'test-model', 5, null, { callbacks: { onError: () => {} } });
+    assert.ok(!fs.existsSync(file), 'the write was denied');
+    assert.strictEqual(checkpointStore.list().length, 0, 'no checkpoint for a denied call');
+  } finally {
+    await mock.close();
+  }
+});
+// ---------------------------------------------------------------------------
+// 3. A subagent's mutation is checkpointed in the PARENT session, rewindable
+// ---------------------------------------------------------------------------
+test('a subagent mutation is checkpointed in the parent session and is rewindable', async () => {
+  const dir = tmpdir();
+  const file = path.join(dir, 'child.txt');
+  fs.writeFileSync(file, 'BEFORE');
+  const cwd0 = process.cwd();
+  process.chdir(dir);
+  const mock = await startMockLLM();
+  // Parent dispatches spawn_agent; the child performs the write; child + parent
+  // each conclude. The child reuses the parent's agentExecFile, so its mutation
+  // flows through the SAME checkpoint store.
+  mock.replyWithToolCall('spawn_agent', { prompt: 'rewrite child.txt' }); // parent iter 0
+  mock.replyWith(`<write_file path="${file}">AFTER</write_file>`);        // child iter 0 (the mutation)
+  mock.replyWith('child done');                                          // child iter 1 (final)
+  mock.replyWith('parent done');                                         // parent iter 1 (final)
+  try {
+    const { runner, checkpointStore } = buildStack(mock.base, { skipPermissions: true, withSubagents: true });
+    const messages = [{ role: 'user', content: 'delegate a write' }];
+    await runner.runAgentLoop(messages, 'test-model', 6, null, { callbacks: { onError: () => {} } });
+    assert.strictEqual(fs.readFileSync(file, 'utf8'), 'AFTER', 'the child performed the write');
+    const items = checkpointStore.list();
+    assert.strictEqual(items.length, 1, "the child's write is checkpointed in the parent session");
+    const rec = checkpointStore._loadRecord(items[0].seq);
+    assert.strictEqual(rec.targets[0].path, file);
+    // linked to the parent's turn (the parent never reset turn context for the child)
+    assert.strictEqual(rec.turn.turnId, 'turn-1');
+    const res = checkpointStore.rewind('last');
+    assert.ok(res.ok);
+    assert.strictEqual(fs.readFileSync(file, 'utf8'), 'BEFORE', "a subagent's mutation is rewindable from the parent");
+  } finally {
+    await mock.close();
+    process.chdir(cwd0);
+  }
+});