npm - @undeemed/get-shit-done-codex - Versions diffs - 1.24.1 → 1.24.3 - Mend

@undeemed/get-shit-done-codex 1.24.1 → 1.24.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/README.md +72 -12
package/get-shit-done/AGENTS.md +59 -23
package/get-shit-done/bin/gsd-tools.cjs +293 -124
package/get-shit-done/bin/lib/core.cjs +16 -16
package/get-shit-done/references/model-profile-resolution.md +2 -2
package/get-shit-done/references/model-profiles.md +29 -29
package/get-shit-done/workflows/help.md +3 -3
package/get-shit-done/workflows/new-project.md +6 -6
package/get-shit-done/workflows/set-profile.md +3 -3
package/get-shit-done/workflows/settings.md +3 -3
package/package.json +3 -2
package/scripts/run-tests.cjs +38 -24

package/get-shit-done/bin/lib/core.cjs CHANGED Viewed

@@ -16,21 +16,21 @@ function toPosixPath(p) {
 // ─── Model Profile Table ─────────────────────────────────────────────────────
 const MODEL_PROFILES = {
-  //                              quality                          balanced                         budget
-  'gsd-planner':              { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'high' },   budget: { m: 'gpt-5.3-codex', t: 'medium' } },
-  'gsd-roadmapper':           { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-executor':             { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-phase-researcher':     { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-project-researcher':   { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-research-synthesizer': { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-debugger':             { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'high' },   budget: { m: 'gpt-5.3-codex', t: 'medium' } },
-  'gsd-codebase-mapper':      { quality: { m: 'gpt-5.3-codex', t: 'low' },    balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-verifier':             { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-plan-checker':         { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
-  'gsd-integration-checker':  { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'low' },    budget: { m: 'gpt-5.3-codex', t: 'low' } },
+  //                              quality                           balanced                          budget
+  'gsd-planner':              { quality: { m: 'gpt-5.3-codex', t: 'xhigh' },  balanced: { m: 'gpt-5.3-codex', t: 'xhigh' },  budget: { m: 'gpt-5.3-codex', t: 'high' } },
+  'gsd-roadmapper':           { quality: { m: 'gpt-5.3-codex', t: 'xhigh' },  balanced: { m: 'gpt-5.3-codex', t: 'high' },   budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-executor':             { quality: { m: 'gpt-5.3-codex', t: 'xhigh' },  balanced: { m: 'gpt-5.3-codex', t: 'high' },   budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-phase-researcher':     { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-project-researcher':   { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-research-synthesizer': { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-debugger':             { quality: { m: 'gpt-5.3-codex', t: 'xhigh' },  balanced: { m: 'gpt-5.3-codex', t: 'xhigh' },  budget: { m: 'gpt-5.3-codex', t: 'high' } },
+  'gsd-codebase-mapper':      { quality: { m: 'gpt-5.3-codex', t: 'medium' }, balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-verifier':             { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'high' },   budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-plan-checker':         { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
+  'gsd-integration-checker':  { quality: { m: 'gpt-5.3-codex', t: 'high' },   balanced: { m: 'gpt-5.3-codex', t: 'medium' }, budget: { m: 'gpt-5.3-codex', t: 'medium' } },
 };
-const DEFAULT_ENTRY = { m: 'gpt-5.3-codex', t: 'medium' };
+const DEFAULT_ENTRY = { m: 'gpt-5.3-codex', t: 'high' };
 // ─── Output helpers ───────────────────────────────────────────────────────────
@@ -366,15 +366,15 @@ function resolveModelInternal(cwd, agentType) {
   if (override) {
     // Override can be a string (thinking level) or { m, t } object
     if (typeof override === 'string') {
-      return { model: 'inherit', thinking: override === 'high' || override === 'medium' || override === 'low' ? override : 'medium' };
+      return { model: 'inherit', thinking: override === 'xhigh' || override === 'high' || override === 'medium' || override === 'low' ? override : 'high' };
     }
-    return { model: 'inherit', thinking: override.t || 'medium' };
+    return { model: 'inherit', thinking: override.t || 'high' };
   }
   // Fall back to profile lookup
   const profile = config.model_profile || 'balanced';
   const agentModels = MODEL_PROFILES[agentType];
-  if (!agentModels) return { model: 'inherit', thinking: 'medium' };
+  if (!agentModels) return { model: 'inherit', thinking: 'high' };
   const entry = agentModels[profile] || agentModels['balanced'] || DEFAULT_ENTRY;
   return { model: 'inherit', thinking: entry.t };
 }

package/get-shit-done/references/model-profile-resolution.md CHANGED Viewed

@@ -17,7 +17,7 @@ Default: `balanced` if not set or config missing.
 Look up the agent in the table for the resolved profile. Each entry returns:
 ```json
-{ "model": "inherit", "thinking": "high" }
+{ "model": "inherit", "thinking": "xhigh" }
 ```
 All agents use `gpt-5.3-codex` (via `"inherit"`). The `thinking` field controls reasoning effort.
@@ -29,7 +29,7 @@ Task(
   prompt="...",
   subagent_type="gsd-planner",
   model="inherit",
-  thinking="{resolved_thinking}"  # "high", "medium", or "low"
+  thinking="{resolved_thinking}"  # "xhigh", "high", "medium", or "low"
 )
 ```

package/get-shit-done/references/model-profiles.md CHANGED Viewed

@@ -6,17 +6,17 @@ Model profiles control the reasoning effort level for each GSD agent. All agents
 | Agent                    | `quality` | `balanced` | `budget`  |
 | ------------------------ | --------- | ---------- | --------- |
-| gsd-planner              | 🟢 high   | 🟢 high    | 🟡 medium |
-| gsd-roadmapper           | 🟢 high   | 🟡 medium  | 🔵 low    |
-| gsd-executor             | 🟢 high   | 🟡 medium  | 🔵 low    |
-| gsd-phase-researcher     | 🟡 medium | 🔵 low     | 🔵 low    |
-| gsd-project-researcher   | 🟡 medium | 🔵 low     | 🔵 low    |
-| gsd-research-synthesizer | 🟡 medium | 🔵 low     | 🔵 low    |
-| gsd-debugger             | 🟢 high   | 🟢 high    | 🟡 medium |
-| gsd-codebase-mapper      | 🔵 low    | 🔵 low     | 🔵 low    |
-| gsd-verifier             | 🟡 medium | 🟡 medium  | 🔵 low    |
-| gsd-plan-checker         | 🟡 medium | 🔵 low     | 🔵 low    |
-| gsd-integration-checker  | 🟡 medium | 🔵 low     | 🔵 low    |
+| gsd-planner              | 🔴 xhigh  | 🔴 xhigh   | 🟢 high   |
+| gsd-roadmapper           | 🔴 xhigh  | 🟢 high    | 🟡 medium |
+| gsd-executor             | 🔴 xhigh  | 🟢 high    | 🟡 medium |
+| gsd-phase-researcher     | 🟢 high   | 🟡 medium  | 🟡 medium |
+| gsd-project-researcher   | 🟢 high   | 🟡 medium  | 🟡 medium |
+| gsd-research-synthesizer | 🟢 high   | 🟡 medium  | 🟡 medium |
+| gsd-debugger             | 🔴 xhigh  | 🔴 xhigh   | 🟢 high   |
+| gsd-codebase-mapper      | 🟡 medium | 🟡 medium  | 🟡 medium |
+| gsd-verifier             | 🟢 high   | 🟢 high    | 🟡 medium |
+| gsd-plan-checker         | 🟢 high   | 🟡 medium  | 🟡 medium |
+| gsd-integration-checker  | 🟢 high   | 🟡 medium  | 🟡 medium |
 All entries resolve to `model: "inherit"` (uses the session's gpt-5.3-codex). The `thinking` field controls reasoning effort.
@@ -24,39 +24,39 @@ All entries resolve to `model: "inherit"` (uses the session's gpt-5.3-codex). Th
 **quality** - Maximum reasoning for every role
-- 🟢 **high** for decision-makers: planner, roadmapper, executor, debugger
-- 🟡 **medium** for analysis: researchers, verifiers, checkers
-- 🔵 **low** for read-only mapping
+- 🔴 **xhigh** for decision-makers: planner, roadmapper, executor, debugger
+- 🟢 **high** for analysis: researchers, verifiers, checkers
+- 🟡 **medium** for read-only mapping
 - Use when: critical architecture work, complex debugging
 **balanced** (default) - Smart thinking allocation
-- 🟢 **high** only for planner and debugger (highest-impact decisions)
-- 🟡 **medium** for executor and verifier (needs reasoning but follows plans)
-- 🔵 **low** for everything else (structured output, scanning)
+- 🔴 **xhigh** only for planner and debugger (highest-impact decisions)
+- 🟢 **high** for roadmapper, executor, and verifier (needs reasoning but follows plans)
+- 🟡 **medium** for everything else (structured output, scanning)
 - Use when: normal development
 **budget** - Minimal reasoning budget
-- 🟡 **medium** for planner and debugger (always need some reasoning)
-- 🔵 **low** for everything else
+- 🟢 **high** for planner and debugger (always need some reasoning)
+- 🟡 **medium** for everything else
 - Use when: high-volume work, less critical phases
 ## Role-Based Thinking Rationale
-**Why high thinking for gsd-planner?**
+**Why xhigh thinking for gsd-planner?**
 Planning involves architecture decisions, goal decomposition, and task design. These decisions cascade through the entire phase — worth the extra reasoning budget.
-**Why high thinking for gsd-debugger even in balanced?**
+**Why xhigh thinking for gsd-debugger even in balanced?**
 Root cause analysis requires deep reasoning. A debugger that misdiagnoses wastes more tokens in re-runs than the reasoning cost.
-**Why low thinking for gsd-codebase-mapper?**
+**Why medium thinking for gsd-codebase-mapper?**
 Read-only file scanning and pattern extraction. No decisions to make — just structured output from file contents.
-**Why medium thinking for gsd-verifier in balanced?**
-Verification requires goal-backward reasoning — checking if code _delivers_ what the phase promised. Low thinking may miss subtle gaps.
+**Why high thinking for gsd-verifier in balanced?**
+Verification requires goal-backward reasoning — checking if code _delivers_ what the phase promised. Medium thinking may miss subtle gaps.
-**Why low thinking for researchers in balanced?**
+**Why medium thinking for researchers in balanced?**
 Research agents scan and collect information. The synthesis happens elsewhere. They don't need deep reasoning for reading files.
 ## Resolution Logic
@@ -70,7 +70,7 @@ Orchestrators resolve model and thinking before spawning:
 4. Pass model + thinking to Task call
 ```
-Returns: `{ model: "inherit", thinking: "high"|"medium"|"low" }`
+Returns: `{ model: "inherit", thinking: "xhigh"|"high"|"medium"|"low" }`
 ## Per-Agent Overrides
@@ -80,13 +80,13 @@ Override thinking level for specific agents:
 {
   "model_profile": "balanced",
   "model_overrides": {
-    "gsd-executor": "high",
-    "gsd-codebase-mapper": "medium"
+    "gsd-executor": "xhigh",
+    "gsd-codebase-mapper": "high"
   }
 }
 ```
-Valid override values: `"high"`, `"medium"`, `"low"`.
+Valid override values: `"xhigh"`, `"high"`, `"medium"`, `"low"`.
 ## Switching Profiles

package/get-shit-done/workflows/help.md CHANGED Viewed

@@ -309,9 +309,9 @@ Usage: `$gsd-settings`
 **`$gsd-set-profile <profile>`**
 Quick switch model profile for GSD agents.
-- `quality` — high thinking for decision-makers, medium for analysis agents
-- `balanced` — high thinking for planner/debugger, medium/low for others (default)
-- `budget` — minimal thinking — medium for planner/debugger, low everywhere else
+- `quality` — xhigh thinking for decision-makers, high for analysis agents
+- `balanced` — xhigh thinking for planner/debugger, high/medium for others (default)
+- `budget` — minimal thinking — high for planner/debugger, medium everywhere else
 Usage: `$gsd-set-profile budget`

package/get-shit-done/workflows/new-project.md CHANGED Viewed

@@ -164,9 +164,9 @@ AskUserQuestion([
     question: "Which AI models for planning agents?",
     multiSelect: false,
     options: [
-      { label: "Balanced (Recommended)", description: "gpt-5.3-codex — smart thinking allocation per role" },
-      { label: "Quality", description: "gpt-5.3-codex — high thinking for all decision-makers" },
-      { label: "Budget", description: "gpt-5.3-codex — minimal thinking, fastest/cheapest" }
+      { label: "Balanced (Recommended)", description: "gpt-5.3-codex — xhigh/high/medium thinking allocation per role" },
+      { label: "Quality", description: "gpt-5.3-codex — xhigh thinking for all decision-makers" },
+      { label: "Budget", description: "gpt-5.3-codex — high/medium thinking, fastest/cheapest" }
     ]
   }
 ])
@@ -459,9 +459,9 @@ questions: [
     question: "Which AI models for planning agents?",
     multiSelect: false,
     options: [
-      { label: "Balanced (Recommended)", description: "gpt-5.3-codex — smart thinking allocation per role" },
-      { label: "Quality", description: "gpt-5.3-codex — high thinking for all decision-makers" },
-      { label: "Budget", description: "gpt-5.3-codex — minimal thinking, fastest/cheapest" }
+      { label: "Balanced (Recommended)", description: "gpt-5.3-codex — xhigh/high/medium thinking allocation per role" },
+      { label: "Quality", description: "gpt-5.3-codex — xhigh thinking for all decision-makers" },
+      { label: "Budget", description: "gpt-5.3-codex — high/medium thinking, fastest/cheapest" }
     ]
   }
 ]

package/get-shit-done/workflows/set-profile.md CHANGED Viewed

@@ -58,9 +58,9 @@ Agents will now use:
 Example:
 | Agent | Model | Thinking |
 |-------|-------|----------|
-| gsd-planner | gpt-5.3-codex | high |
-| gsd-executor | gpt-5.3-codex | medium |
-| gsd-verifier | gpt-5.3-codex | medium |
+| gsd-planner | gpt-5.3-codex | xhigh |
+| gsd-executor | gpt-5.3-codex | high |
+| gsd-verifier | gpt-5.3-codex | high |
 | ... | ... | ... |
 Next spawned agents will use the new profile.

package/get-shit-done/workflows/settings.md CHANGED Viewed

@@ -43,9 +43,9 @@ AskUserQuestion([
     header: "Model",
     multiSelect: false,
     options: [
-      { label: "Quality", description: "gpt-5.3-codex with high thinking for decision-makers, medium for analysis" },
-      { label: "Balanced (Recommended)", description: "gpt-5.3-codex with high thinking for planner/debugger, lower for others" },
-      { label: "Budget", description: "gpt-5.3-codex with minimal thinking — fastest, lowest cost" }
+      { label: "Quality", description: "gpt-5.3-codex with xhigh thinking for decision-makers, high for analysis" },
+      { label: "Balanced (Recommended)", description: "gpt-5.3-codex with xhigh thinking for planner/debugger, high/medium for others" },
+      { label: "Budget", description: "gpt-5.3-codex with high thinking for planner/debugger, medium everywhere else" }
     ]
   },
   {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@undeemed/get-shit-done-codex",
-  "version": "1.24.1",
+  "version": "1.24.3",
   "description": "A meta-prompting, context engineering and spec-driven development system for OpenAI Codex (CLI and Desktop). Fork of get-shit-done by TÂCHES, adapted for Codex.",
   "bin": {
     "get-shit-done-codex": "bin/install.js"
@@ -67,6 +67,7 @@
   "scripts": {
     "build:hooks": "node scripts/build-hooks.js",
     "prepublishOnly": "npm run build:hooks",
-    "test": "node --test tests/*.test.cjs"
+    "test": "node scripts/run-tests.cjs",
+    "test:coverage": "node scripts/run-tests.cjs --coverage"
   }
 }

package/scripts/run-tests.cjs CHANGED Viewed

@@ -1,29 +1,43 @@
 #!/usr/bin/env node
-// Cross-platform test runner — resolves test file globs via Node
-// instead of relying on shell expansion (which fails on Windows PowerShell/cmd).
-// Propagates NODE_V8_COVERAGE so c8 collects coverage from the child process.
-'use strict';
-const { readdirSync } = require('fs');
-const { join } = require('path');
-const { execFileSync } = require('child_process');
-const testDir = join(__dirname, '..', 'tests');
-const files = readdirSync(testDir)
-  .filter(f => f.endsWith('.test.cjs'))
-  .sort()
-  .map(f => join('tests', f));
-if (files.length === 0) {
-  console.error('No test files found in tests/');
+const fs = require("node:fs");
+const path = require("node:path");
+const { spawnSync } = require("node:child_process");
+function collectTests(dir) {
+  if (!fs.existsSync(dir)) return [];
+  const entries = fs.readdirSync(dir, { withFileTypes: true });
+  const files = [];
+  for (const entry of entries) {
+    const fullPath = path.join(dir, entry.name);
+    if (entry.isDirectory()) {
+      files.push(...collectTests(fullPath));
+      continue;
+    }
+    if (entry.isFile() && entry.name.endsWith(".test.cjs")) {
+      files.push(fullPath);
+    }
+  }
+  return files;
+}
+const withCoverage = process.argv.includes("--coverage");
+const testFiles = collectTests(path.resolve(__dirname, "..", "tests")).sort();
+if (testFiles.length === 0) {
+  console.error("No test files found in ./tests");
   process.exit(1);
 }
-try {
-  execFileSync(process.execPath, ['--test', ...files], {
-    stdio: 'inherit',
-    env: { ...process.env },
-  });
-} catch (err) {
-  process.exit(err.status || 1);
+const args = [];
+if (withCoverage) args.push("--experimental-test-coverage");
+args.push("--test", ...testFiles);
+const result = spawnSync(process.execPath, args, { stdio: "inherit" });
+if (result.error) {
+  console.error(result.error.message);
+  process.exit(1);
 }
+process.exit(result.status ?? 1);