npm - gsd-pi - Versions diffs - 2.60.0-dev.2580e65 → 2.60.0-dev.d9052f5 - Mend

gsd-pi 2.60.0-dev.2580e65 → 2.60.0-dev.d9052f5

This diff shows the changes between two publicly available versions of a package, each of which has been released to one of the supported registries. The information in this diff is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (196)

package/src/resources/extensions/gsd/tests/model-router.test.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import test, { describe } from "node:test";
+import test from "node:test";
 import assert from "node:assert/strict";
 import {
@@ -7,8 +7,6 @@ import {
   defaultRoutingConfig,
   scoreModel,
   computeTaskRequirements,
-  scoreEligibleModels,
-  getEligibleModels,
   MODEL_CAPABILITY_PROFILES,
 } from "../model-router.js";
 import type { DynamicRoutingConfig, RoutingDecision, ModelCapabilities } from "../model-router.js";
@@ -213,9 +211,9 @@ test("#2192: known model is still downgraded normally", () => {
 // ─── Capability Scoring (ADR-004 Phase 2) ───────────────────────────────────
-test("defaultRoutingConfig includes capability_routing: true", () => {
+test("defaultRoutingConfig includes capability_routing: false", () => {
   const config = defaultRoutingConfig();
-  assert.equal(config.capability_routing, true);
+  assert.equal(config.capability_routing, false);
 });
 test("scoreModel computes weighted average of capability × requirement", () => {
@@ -358,401 +356,3 @@ test("#2885: heavy openai-codex model downgrades to light for light task", () =>
   // Should pick a light-tier model
   assert.notEqual(result.modelId, "gpt-5.4", "should not use the heavy model for light task");
 });
-// ─── scoreModel ──────────────────────────────────────────────────────────────
-describe("scoreModel", () => {
-  const sonnetProfile: ModelCapabilities = MODEL_CAPABILITY_PROFILES["claude-sonnet-4-6"]!;
-  test("produces correct weighted average for two dimensions (coding:0.9, instruction:0.7)", () => {
-    // (0.9*85 + 0.7*85) / (0.9+0.7) = (76.5+59.5)/1.6 = 136/1.6 = 85.0
-    const score = scoreModel(sonnetProfile, { coding: 0.9, instruction: 0.7 });
-    assert.ok(Math.abs(score - 85.0) < 0.01, `Expected ~85.0, got ${score}`);
-  });
-  test("returns 50 when requirements is empty", () => {
-    const score = scoreModel(sonnetProfile, {});
-    assert.equal(score, 50);
-  });
-  test("returns correct score for single dimension coding:1.0", () => {
-    // coding=90 for claude-opus-4-6
-    const opusProfile = MODEL_CAPABILITY_PROFILES["claude-opus-4-6"]!;
-    const score = scoreModel(opusProfile, { coding: 1.0 });
-    assert.equal(score, 95);
-  });
-  test("handles all 7 dimensions correctly", () => {
-    // Uniform weight 1.0 on every dim → average of all dim values
-    const profile: ModelCapabilities = {
-      coding: 60, debugging: 60, research: 60, reasoning: 60,
-      speed: 60, longContext: 60, instruction: 60,
-    };
-    const reqs: Partial<Record<keyof ModelCapabilities, number>> = {
-      coding: 1.0, debugging: 1.0, research: 1.0, reasoning: 1.0,
-      speed: 1.0, longContext: 1.0, instruction: 1.0,
-    };
-    const score = scoreModel(profile, reqs);
-    assert.equal(score, 60);
-  });
-});
-// ─── computeTaskRequirements ─────────────────────────────────────────────────
-describe("computeTaskRequirements", () => {
-  test("execute-task with no metadata returns base vector", () => {
-    const req = computeTaskRequirements("execute-task", undefined);
-    assert.deepStrictEqual(req, { coding: 0.9, instruction: 0.7, speed: 0.3 });
-  });
-  test("execute-task with tags:['docs'] adjusts requirements", () => {
-    const req = computeTaskRequirements("execute-task", { tags: ["docs"] });
-    assert.equal(req.instruction, 0.9);
-    assert.equal(req.coding, 0.3);
-    assert.equal(req.speed, 0.7);
-  });
-  test("execute-task with tags:['config'] adjusts requirements", () => {
-    const req = computeTaskRequirements("execute-task", { tags: ["config"] });
-    assert.equal(req.instruction, 0.9);
-  });
-  test("execute-task with complexityKeywords:['concurrency'] boosts debugging and reasoning", () => {
-    const req = computeTaskRequirements("execute-task", { complexityKeywords: ["concurrency"] });
-    assert.equal(req.debugging, 0.9);
-    assert.equal(req.reasoning, 0.8);
-  });
-  test("execute-task with complexityKeywords:['migration'] boosts reasoning and coding", () => {
-    const req = computeTaskRequirements("execute-task", { complexityKeywords: ["migration"] });
-    assert.equal(req.reasoning, 0.9);
-    assert.equal(req.coding, 0.8);
-  });
-  test("execute-task with fileCount:8 boosts coding and reasoning", () => {
-    const req = computeTaskRequirements("execute-task", { fileCount: 8 });
-    assert.equal(req.coding, 0.9);
-    assert.equal(req.reasoning, 0.7);
-  });
-  test("execute-task with estimatedLines:600 boosts coding and reasoning", () => {
-    const req = computeTaskRequirements("execute-task", { estimatedLines: 600 });
-    assert.equal(req.coding, 0.9);
-    assert.equal(req.reasoning, 0.7);
-  });
-  test("research-milestone returns correct base vector", () => {
-    const req = computeTaskRequirements("research-milestone");
-    assert.deepStrictEqual(req, { research: 0.9, longContext: 0.7, reasoning: 0.5 });
-  });
-  test("plan-slice returns correct base vector", () => {
-    const req = computeTaskRequirements("plan-slice");
-    assert.deepStrictEqual(req, { reasoning: 0.9, coding: 0.5 });
-  });
-  test("unknown-unit-type returns default reasoning requirement", () => {
-    const req = computeTaskRequirements("unknown-unit-type");
-    assert.deepStrictEqual(req, { reasoning: 0.5 });
-  });
-  test("non-execute-task with metadata ignores metadata refinements", () => {
-    // research-milestone should return the same vector regardless of metadata
-    const reqWithMeta = computeTaskRequirements("research-milestone", { tags: ["docs"], fileCount: 10 });
-    const reqWithout = computeTaskRequirements("research-milestone");
-    assert.deepStrictEqual(reqWithMeta, reqWithout);
-  });
-});
-// ─── scoreEligibleModels ─────────────────────────────────────────────────────
-describe("scoreEligibleModels", () => {
-  test("ranks models by score descending when scores differ by more than 2", () => {
-    // research: heavily weights research dimension. gemini-2.5-pro has 85 research vs sonnet's 75
-    const requirements = { research: 0.9, longContext: 0.7, reasoning: 0.5 };
-    const results = scoreEligibleModels(["claude-sonnet-4-6", "gemini-2.5-pro"], requirements);
-    assert.equal(results.length, 2);
-    assert.ok(results[0].score >= results[1].score, "Should be sorted by score descending");
-  });
-  test("within 2-point threshold, prefers cheaper model", () => {
-    // Use models without built-in profiles (both get score 50) so tie-break applies
-    // Then use known models with equal scores: force this via single unknown model pair
-    const requirements = { coding: 1.0 };
-    // model-a and model-b are both unknown → score=50, cost=Infinity → lexicographic
-    const results = scoreEligibleModels(["model-z", "model-a"], requirements);
-    // Both unknown: score=50 (within 2), cost=Infinity (equal) → lex: model-a first
-    assert.equal(results[0].modelId, "model-a");
-  });
-  test("single model returns array of one", () => {
-    const results = scoreEligibleModels(["claude-sonnet-4-6"], { coding: 0.9 });
-    assert.equal(results.length, 1);
-    assert.equal(results[0].modelId, "claude-sonnet-4-6");
-  });
-  test("unknown model with no profile gets score of 50", () => {
-    const results = scoreEligibleModels(["totally-unknown-model"], { coding: 1.0 });
-    assert.equal(results[0].score, 50);
-  });
-  test("capabilityOverrides deep-merges with built-in profile", () => {
-    const requirements = { coding: 1.0 };
-    // Override sonnet's coding to 30 — gpt-4o (coding=80) should win
-    const results = scoreEligibleModels(
-      ["claude-sonnet-4-6", "gpt-4o"],
-      requirements,
-      { "claude-sonnet-4-6": { coding: 30 } },
-    );
-    assert.equal(results[0].modelId, "gpt-4o", "gpt-4o should rank first after coding override");
-  });
-});
-// ─── getEligibleModels ───────────────────────────────────────────────────────
-describe("getEligibleModels", () => {
-  const ALL_MODELS = [
-    "claude-opus-4-6",   // heavy
-    "claude-sonnet-4-6", // standard
-    "claude-haiku-4-5",  // light
-    "gpt-4o-mini",       // light
-    "gpt-4o",            // standard
-  ];
-  test("returns light-tier models from available list sorted by cost", () => {
-    const config: DynamicRoutingConfig = defaultRoutingConfig();
-    const result = getEligibleModels("light", ALL_MODELS, config);
-    assert.ok(result.length >= 1);
-    for (const id of result) {
-      assert.ok(
-        ["claude-haiku-4-5", "gpt-4o-mini"].includes(id),
-        `Expected light-tier model, got ${id}`,
-      );
-    }
-  });
-  test("returns standard-tier models from available list sorted by cost", () => {
-    const config: DynamicRoutingConfig = defaultRoutingConfig();
-    const result = getEligibleModels("standard", ALL_MODELS, config);
-    assert.ok(result.length >= 1);
-    for (const id of result) {
-      assert.ok(
-        ["claude-sonnet-4-6", "gpt-4o"].includes(id),
-        `Expected standard-tier model, got ${id}`,
-      );
-    }
-  });
-  test("tier_models pinned model returns single-element array", () => {
-    const config: DynamicRoutingConfig = {
-      ...defaultRoutingConfig(),
-      tier_models: { light: "gpt-4o-mini" },
-    };
-    const result = getEligibleModels("light", ALL_MODELS, config);
-    assert.deepStrictEqual(result, ["gpt-4o-mini"]);
-  });
-  test("empty available list returns empty array", () => {
-    const config: DynamicRoutingConfig = defaultRoutingConfig();
-    const result = getEligibleModels("light", [], config);
-    assert.equal(result.length, 0);
-  });
-  test("unknown models classified as standard appear in standard tier results", () => {
-    const config: DynamicRoutingConfig = defaultRoutingConfig();
-    // unknown-model-xyz has no entry → defaults to standard tier
-    const result = getEligibleModels("standard", ["unknown-model-xyz"], config);
-    assert.ok(result.includes("unknown-model-xyz"), "Unknown model should appear in standard tier");
-  });
-});
-// ─── capability-aware routing integration ────────────────────────────────────
-describe("capability-aware routing integration", () => {
-  // All standard-tier models available alongside heavy (opus)
-  const MULTI_MODEL_AVAILABLE = [
-    "claude-opus-4-6",
-    "claude-sonnet-4-6",
-    "gpt-4o",
-    "gemini-2.5-pro",
-    "claude-haiku-4-5",
-    "gpt-4o-mini",
-  ];
-  // 1. Full pipeline with capability scoring active
-  test("full pipeline with capability_routing: true returns capability-scored decision", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true, capability_routing: true };
-    // Configured primary is opus (heavy) — standard tier should trigger capability scoring
-    const result = resolveModelForComplexity(
-      { tier: "standard", reason: "test", downgraded: false },
-      { primary: "claude-opus-4-6", fallbacks: [] },
-      config,
-      MULTI_MODEL_AVAILABLE,
-      "execute-task",
-      { tags: [], complexityKeywords: [], fileCount: 3, estimatedLines: 100, codeBlockCount: 0 },
-    );
-    assert.equal(result.selectionMethod, "capability-scored", "should use capability scoring when enabled with multiple eligible models");
-    assert.ok(result.capabilityScores !== undefined, "capabilityScores should be populated");
-    assert.ok(Object.keys(result.capabilityScores!).length > 1, "should have scores for multiple models");
-    assert.equal(result.wasDowngraded, true, "should be downgraded from opus");
-  });
-  // 2. capability_routing: false falls back to tier-only
-  test("capability_routing: false skips scoring and uses tier-only", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true, capability_routing: false };
-    const result = resolveModelForComplexity(
-      { tier: "standard", reason: "test", downgraded: false },
-      { primary: "claude-opus-4-6", fallbacks: [] },
-      config,
-      MULTI_MODEL_AVAILABLE,
-      "execute-task",
-      undefined,
-    );
-    assert.equal(result.selectionMethod, "tier-only", "capability_routing: false should use tier-only");
-    assert.equal(result.capabilityScores, undefined, "capabilityScores should be undefined for tier-only");
-  });
-  // 3. Single eligible model skips scoring
-  test("single eligible model skips capability scoring and uses tier-only", () => {
-    const config: DynamicRoutingConfig = {
-      ...defaultRoutingConfig(),
-      enabled: true,
-      capability_routing: true,
-      tier_models: { standard: "claude-sonnet-4-6" },
-    };
-    // Pin to single standard model — eligible.length === 1 → skips STEP 2
-    const result = resolveModelForComplexity(
-      { tier: "standard", reason: "test", downgraded: false },
-      { primary: "claude-opus-4-6", fallbacks: [] },
-      config,
-      MULTI_MODEL_AVAILABLE,
-      "execute-task",
-      undefined,
-    );
-    // Single pinned model → tier-only (no scoring needed)
-    assert.equal(result.selectionMethod, "tier-only", "single eligible model should use tier-only");
-    assert.equal(result.modelId, "claude-sonnet-4-6", "should use the pinned model");
-  });
-  // 4. Unknown model with no profile gets uniform 50s and competes
-  test("unknown model with no profile gets uniform score of 50 and can compete", () => {
-    const unknownModel = "unknown-future-model-xyz";
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true, capability_routing: true };
-    // Add unknown model to available list at standard tier (unknown → standard per D-15)
-    // scoring should still work with score=50 for the unknown model
-    const requirements = { coding: 0.9, instruction: 0.7, speed: 0.3 };
-    const scored = scoreEligibleModels([unknownModel, "claude-sonnet-4-6"], requirements);
-    const unknownEntry = scored.find(s => s.modelId === unknownModel);
-    assert.ok(unknownEntry !== undefined, "unknown model should be in scored results");
-    // Unknown model gets uniform 50s: (0.9*50 + 0.7*50 + 0.3*50) / (0.9+0.7+0.3) ≈ 50
-    assert.ok(Math.abs(unknownEntry!.score - 50) < 0.01, `expected score ~50, got ${unknownEntry!.score}`);
-  });
-  // 5. Capability overrides change scoring outcome
-  test("capabilityOverrides boost a model above another for same task", () => {
-    // sonnet: coding=85, gpt-4o: coding=80. Override gpt-4o coding to 99 → gpt-4o should win.
-    const requirements = { coding: 1.0 };
-    const overrides = { "gpt-4o": { coding: 99 } };
-    const scored = scoreEligibleModels(["claude-sonnet-4-6", "gpt-4o"], requirements, overrides);
-    assert.equal(scored[0].modelId, "gpt-4o", "overridden model should win for coding-heavy task");
-    assert.ok(scored[0].score > 90, `expected score > 90 after override, got ${scored[0].score}`);
-  });
-  // 5b. Capability overrides pass through resolveModelForComplexity to scoreEligibleModels
-  test("resolveModelForComplexity passes capabilityOverrides to scoring step", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true, capability_routing: true };
-    // sonnet coding=85, gpt-4o coding=80. Override gpt-4o coding to 99 → gpt-4o should win.
-    const overrides: Record<string, Partial<ModelCapabilities>> = { "gpt-4o": { coding: 99 } };
-    const result = resolveModelForComplexity(
-      { tier: "standard", reason: "test", downgraded: false },
-      { primary: "claude-opus-4-6", fallbacks: [] },
-      config,
-      ["claude-opus-4-6", "claude-sonnet-4-6", "gpt-4o"],
-      "execute-task",
-      undefined,
-      overrides,
-    );
-    assert.equal(result.selectionMethod, "capability-scored");
-    assert.equal(result.modelId, "gpt-4o", "gpt-4o should win with coding override");
-  });
-  // 6. Regression: existing routing guards unchanged
-  test("regression: routing-disabled passthrough still returns tier-only", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: false };
-    const result = resolveModelForComplexity(
-      { tier: "light", reason: "test", downgraded: false },
-      { primary: "claude-opus-4-6", fallbacks: [] },
-      config,
-      MULTI_MODEL_AVAILABLE,
-      "execute-task",
-      undefined,
-    );
-    assert.equal(result.selectionMethod, "tier-only");
-    assert.equal(result.wasDowngraded, false);
-    assert.equal(result.modelId, "claude-opus-4-6");
-  });
-  test("regression: unknown-model bypass returns tier-only and does not downgrade", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true };
-    const result = resolveModelForComplexity(
-      { tier: "light", reason: "test", downgraded: false },
-      { primary: "totally-unknown-custom-model", fallbacks: [] },
-      config,
-      ["totally-unknown-custom-model", ...MULTI_MODEL_AVAILABLE],
-      "execute-task",
-      undefined,
-    );
-    assert.equal(result.selectionMethod, "tier-only");
-    assert.equal(result.wasDowngraded, false);
-    assert.equal(result.modelId, "totally-unknown-custom-model");
-  });
-  test("regression: no-downgrade-needed path returns tier-only", () => {
-    const config: DynamicRoutingConfig = { ...defaultRoutingConfig(), enabled: true, capability_routing: true };
-    // Configured model is sonnet (standard), requesting standard → no downgrade needed
-    const result = resolveModelForComplexity(
-      { tier: "standard", reason: "test", downgraded: false },
-      { primary: "claude-sonnet-4-6", fallbacks: [] },
-      config,
-      MULTI_MODEL_AVAILABLE,
-      "execute-task",
-      undefined,
-    );
-    assert.equal(result.selectionMethod, "tier-only");
-    assert.equal(result.wasDowngraded, false);
-    assert.equal(result.modelId, "claude-sonnet-4-6");
-  });
-});
-// ─── getModelTier unknown default ────────────────────────────────────────────
-describe("getModelTier unknown default", () => {
-  test("unknown model returns standard tier (not heavy) via downgrade behavior", () => {
-    // We can verify this indirectly: resolveModelForComplexity for a standard classification
-    // with an unknown primary model should NOT downgrade (because unknown → standard, not heavy)
-    const config = { ...defaultRoutingConfig(), enabled: true };
-    // Use "unknown-model-xyz" as primary — its tier will be "standard" per D-15
-    // Classification is "heavy" → tier >= standard → no downgrade
-    // But unknown models use the isKnownModel() guard, so they pass through anyway
-    // Test the positive: an unknown model is NOT treated as heavy
-    const result = resolveModelForComplexity(
-      makeClassification("standard"),
-      { primary: "claude-sonnet-4-6", fallbacks: [] },
-      config,
-      ["claude-sonnet-4-6", "claude-haiku-4-5", "gpt-4o-mini"],
-    );
-    // standard classification with standard model (sonnet) → no downgrade
-    assert.equal(result.wasDowngraded, false, "standard model should not downgrade for standard task");
-    assert.equal(result.modelId, "claude-sonnet-4-6");
-  });
-  test("unknown model in getEligibleModels defaults to standard tier", () => {
-    // Per D-15: getModelTier returns "standard" for unknown models
-    const config: DynamicRoutingConfig = defaultRoutingConfig();
-    const standardModels = getEligibleModels("standard", ["totally-unknown-model-abc"], config);
-    const lightModels = getEligibleModels("light", ["totally-unknown-model-abc"], config);
-    const heavyModels = getEligibleModels("heavy", ["totally-unknown-model-abc"], config);
-    assert.ok(standardModels.includes("totally-unknown-model-abc"), "Unknown model should be in standard tier");
-    assert.equal(lightModels.length, 0, "Unknown model should NOT be in light tier");
-    assert.equal(heavyModels.length, 0, "Unknown model should NOT be in heavy tier");
-  });
-});

package/src/resources/extensions/gsd/tests/preferences.test.ts CHANGED Viewed

@@ -461,65 +461,3 @@ test("experimental.rtk defaults to off in new project preferences", () => {
   assert.notEqual(prefs, null);
   assert.equal(prefs!.experimental?.rtk, undefined);
 });
-// ── Codebase Map Preferences ─────────────────────────────────────────────────
-test("codebase preferences validate and pass through correctly", () => {
-  const result = validatePreferences({
-    codebase: {
-      exclude_patterns: ["docs/", "fixtures/"],
-      max_files: 1000,
-      collapse_threshold: 15,
-    },
-  });
-  assert.equal(result.errors.length, 0);
-  assert.deepEqual(result.preferences.codebase?.exclude_patterns, ["docs/", "fixtures/"]);
-  assert.equal(result.preferences.codebase?.max_files, 1000);
-  assert.equal(result.preferences.codebase?.collapse_threshold, 15);
-});
-test("codebase preferences reject invalid types", () => {
-  const result = validatePreferences({
-    codebase: {
-      exclude_patterns: "not-an-array" as any,
-      max_files: -5,
-      collapse_threshold: 0,
-    },
-  });
-  assert.ok(result.errors.some(e => e.includes("exclude_patterns must be an array")));
-  assert.ok(result.errors.some(e => e.includes("max_files must be a positive")));
-  assert.ok(result.errors.some(e => e.includes("collapse_threshold must be a positive")));
-});
-test("codebase preferences warn on unknown keys", () => {
-  const result = validatePreferences({
-    codebase: {
-      exclude_patterns: ["docs/"],
-      unknown_key: true,
-    } as any,
-  });
-  assert.equal(result.errors.length, 0);
-  assert.ok(result.warnings.some(w => w.includes('unknown codebase key "unknown_key"')));
-  assert.deepEqual(result.preferences.codebase?.exclude_patterns, ["docs/"]);
-});
-test("codebase preferences parse from markdown frontmatter", () => {
-  const content = [
-    "---",
-    "version: 1",
-    "codebase:",
-    "  exclude_patterns:",
-    '    - "docs/"',
-    '    - ".cache/"',
-    "  max_files: 800",
-    "  collapse_threshold: 10",
-    "---",
-  ].join("\n");
-  const prefs = parsePreferencesMarkdown(content);
-  assert.notEqual(prefs, null);
-  const result = validatePreferences(prefs!);
-  assert.equal(result.errors.length, 0);
-  assert.deepEqual(result.preferences.codebase?.exclude_patterns, ["docs/", ".cache/"]);
-  assert.equal(result.preferences.codebase?.max_files, 800);
-  assert.equal(result.preferences.codebase?.collapse_threshold, 10);
-});

package/src/resources/extensions/gsd/tests/remote-questions.test.ts CHANGED Viewed

@@ -739,27 +739,6 @@ test("config source-level: hydration skips api_key entries with empty keys", ()
   );
 });
-test("ask-user-questions source-level: tryRemoteQuestions is called before the hasUI guard", () => {
-  // Regression test for #3480 — remote questions were silently skipped in interactive
-  // mode because tryRemoteQuestions was gated behind `if (!ctx.hasUI)`.
-  // The fix moved the remote call before that guard so configured channels
-  // (Telegram/Slack/Discord) fire regardless of UI availability.
-  const src = readFileSync(
-    join(__dirname, "..", "..", "ask-user-questions.ts"),
-    "utf-8",
-  );
-  const remoteCallIdx = src.indexOf("tryRemoteQuestions(params.questions");
-  const hasUIGuardIdx = src.indexOf("if (!ctx.hasUI)");
-  assert.ok(remoteCallIdx !== -1, "tryRemoteQuestions call should exist in ask-user-questions.ts");
-  assert.ok(hasUIGuardIdx !== -1, "!ctx.hasUI guard should exist in ask-user-questions.ts");
-  assert.ok(
-    remoteCallIdx < hasUIGuardIdx,
-    "tryRemoteQuestions must be called before the !ctx.hasUI guard — otherwise remote questions are skipped in interactive mode",
-  );
-});
 test("config source-level: removeProviderToken uses auth.remove not auth.set with empty key", () => {
   const commandSrc = readFileSync(
     join(__dirname, "..", "..", "remote-questions", "remote-command.ts"),

package/src/resources/extensions/gsd/tests/workflow-logger.test.ts CHANGED Viewed

@@ -240,13 +240,13 @@ describe("workflow-logger", () => {
     test("writes entry to .gsd/audit-log.jsonl after setLogBasePath", () => {
       setLogBasePath(dir);
-      logError("engine", "audit test entry");
+      logWarning("engine", "audit test entry");
       const auditPath = join(dir, ".gsd", "audit-log.jsonl");
       assert.ok(existsSync(auditPath), "audit-log.jsonl should exist");
       const content = readFileSync(auditPath, "utf-8");
       const entry = JSON.parse(content.trim());
-      assert.equal(entry.severity, "error");
+      assert.equal(entry.severity, "warn");
       assert.equal(entry.component, "engine");
       assert.equal(entry.message, "audit test entry");
     });
@@ -254,7 +254,7 @@ describe("workflow-logger", () => {
     test("_resetLogs does not clear the audit base path", () => {
       setLogBasePath(dir);
       _resetLogs();
-      logError("engine", "post-reset entry");
+      logWarning("engine", "post-reset entry");
       const auditPath = join(dir, ".gsd", "audit-log.jsonl");
       assert.ok(existsSync(auditPath), "audit-log.jsonl should exist after _resetLogs");
@@ -293,13 +293,13 @@ describe("workflow-logger", () => {
     test("writes entry to .gsd/audit-log.jsonl after setLogBasePath", () => {
       setLogBasePath(dir);
-      logError("engine", "audit test entry");
+      logWarning("engine", "audit test entry");
       const auditPath = join(dir, ".gsd", "audit-log.jsonl");
       assert.ok(existsSync(auditPath), "audit-log.jsonl should exist");
       const content = readFileSync(auditPath, "utf-8");
       const entry = JSON.parse(content.trim());
-      assert.equal(entry.severity, "error");
+      assert.equal(entry.severity, "warn");
       assert.equal(entry.component, "engine");
       assert.equal(entry.message, "audit test entry");
     });
@@ -307,7 +307,7 @@ describe("workflow-logger", () => {
     test("_resetLogs does not clear the audit base path", () => {
       setLogBasePath(dir);
       _resetLogs();
-      logError("engine", "post-reset entry");
+      logWarning("engine", "post-reset entry");
       const auditPath = join(dir, ".gsd", "audit-log.jsonl");
       assert.ok(existsSync(auditPath), "audit-log.jsonl should exist after _resetLogs");

package/src/resources/extensions/gsd/tools/complete-milestone.ts CHANGED Viewed

@@ -23,7 +23,6 @@ import { invalidateStateCache } from "../state.js";
 import { renderAllProjections } from "../workflow-projections.js";
 import { writeManifest } from "../workflow-manifest.js";
 import { appendEvent } from "../workflow-events.js";
-import { logWarning } from "../workflow-logger.js";
 export interface CompleteMilestoneParams {
   milestoneId: string;
@@ -192,7 +191,9 @@ export async function handleCompleteMilestone(
     await saveFile(summaryPath, summaryMd);
   } catch (renderErr) {
     // Disk render failed — roll back DB status so state stays consistent
-    logWarning("tool", `complete_milestone — disk render failed, rolling back DB status: ${(renderErr as Error).message}`);
+    process.stderr.write(
+      `gsd-db: complete_milestone — disk render failed, rolling back DB status: ${(renderErr as Error).message}\n`,
+    );
     updateMilestoneStatus(params.milestoneId, 'active', null);
     invalidateStateCache();
     return { error: `disk render failed: ${(renderErr as Error).message}` };
@@ -216,7 +217,9 @@ export async function handleCompleteMilestone(
       trigger_reason: params.triggerReason,
     });
   } catch (hookErr) {
-    logWarning("tool", `complete-milestone post-mutation hook warning: ${(hookErr as Error).message}`);
+    process.stderr.write(
+      `gsd: complete-milestone post-mutation hook warning: ${(hookErr as Error).message}\n`,
+    );
   }
   return {

package/src/resources/extensions/gsd/tools/complete-slice.ts CHANGED Viewed

@@ -30,7 +30,6 @@ import { renderRoadmapCheckboxes } from "../markdown-renderer.js";
 import { renderAllProjections } from "../workflow-projections.js";
 import { writeManifest } from "../workflow-manifest.js";
 import { appendEvent } from "../workflow-events.js";
-import { logWarning } from "../workflow-logger.js";
 export interface CompleteSliceResult {
   sliceId: string;
@@ -298,7 +297,9 @@ export async function handleCompleteSlice(
     }
   } catch (renderErr) {
     // Disk render failed — roll back DB status so state stays consistent
-    logWarning("tool", `complete_slice — disk render failed, rolling back DB status: ${(renderErr as Error).message}`);
+    process.stderr.write(
+      `gsd-db: complete_slice — disk render failed, rolling back DB status: ${(renderErr as Error).message}\n`,
+    );
     updateSliceStatus(params.milestoneId, params.sliceId, 'pending');
     invalidateStateCache();
     return { error: `disk render failed: ${(renderErr as Error).message}` };
@@ -325,7 +326,9 @@ export async function handleCompleteSlice(
       trigger_reason: params.triggerReason,
     });
   } catch (hookErr) {
-    logWarning("tool", `complete-slice post-mutation hook warning: ${(hookErr as Error).message}`);
+    process.stderr.write(
+      `gsd: complete-slice post-mutation hook warning: ${(hookErr as Error).message}\n`,
+    );
   }
   return {

package/src/resources/extensions/gsd/tools/complete-task.ts CHANGED Viewed

@@ -33,7 +33,6 @@ import { renderPlanCheckboxes } from "../markdown-renderer.js";
 import { renderAllProjections, renderSummaryContent } from "../workflow-projections.js";
 import { writeManifest } from "../workflow-manifest.js";
 import { appendEvent } from "../workflow-events.js";
-import { logWarning } from "../workflow-logger.js";
 export interface CompleteTaskResult {
   taskId: string;
@@ -211,7 +210,9 @@ export async function handleCompleteTask(
     }
   } catch (renderErr) {
     // Disk render failed — roll back DB status so state stays consistent
-    logWarning("tool", `complete_task — disk render failed, rolling back DB status: ${(renderErr as Error).message}`);
+    process.stderr.write(
+      `gsd-db: complete_task — disk render failed, rolling back DB status: ${(renderErr as Error).message}\n`,
+    );
     // Delete orphaned verification_evidence rows first (FK constraint
     // references tasks, so evidence must go before status change).
     // Without this, retries accumulate duplicate evidence rows (#2724).
@@ -242,7 +243,9 @@ export async function handleCompleteTask(
       trigger_reason: params.triggerReason,
     });
   } catch (hookErr) {
-    logWarning("tool", `complete-task post-mutation hook warning: ${(hookErr as Error).message}`);
+    process.stderr.write(
+      `gsd: complete-task post-mutation hook warning: ${(hookErr as Error).message}\n`,
+    );
   }
   return {