aiwcli 0.12.6 → 0.12.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (163) hide show
  1. package/bin/dev.cmd +3 -3
  2. package/bin/dev.js +16 -16
  3. package/bin/run.cmd +3 -3
  4. package/bin/run.js +21 -21
  5. package/dist/commands/branch.js +7 -2
  6. package/dist/lib/bmad-installer.js +37 -37
  7. package/dist/lib/terminal.d.ts +2 -0
  8. package/dist/lib/terminal.js +57 -7
  9. package/dist/templates/CLAUDE.md +232 -205
  10. package/dist/templates/_shared/.claude/settings.json +65 -65
  11. package/dist/templates/_shared/.claude/{commands/handoff.md → skills/handoff/SKILL.md} +13 -12
  12. package/dist/templates/_shared/.claude/{commands/handoff-resume.md → skills/handoff-resume/SKILL.md} +13 -12
  13. package/dist/templates/_shared/.codex/workflows/handoff.md +226 -226
  14. package/dist/templates/_shared/.windsurf/workflows/handoff.md +226 -226
  15. package/dist/templates/_shared/handoff-system/CLAUDE.md +15 -3
  16. package/dist/templates/_shared/handoff-system/lib/document-generator.ts +215 -215
  17. package/dist/templates/_shared/handoff-system/lib/handoff-reader.ts +158 -158
  18. package/dist/templates/_shared/handoff-system/scripts/resume_handoff.ts +373 -373
  19. package/dist/templates/_shared/handoff-system/scripts/save_handoff.ts +469 -469
  20. package/dist/templates/_shared/handoff-system/workflows/handoff-resume.md +66 -66
  21. package/dist/templates/_shared/handoff-system/workflows/handoff.md +254 -254
  22. package/dist/templates/_shared/hooks-ts/_utils/git-state.ts +2 -2
  23. package/dist/templates/_shared/hooks-ts/archive_plan.ts +159 -159
  24. package/dist/templates/_shared/hooks-ts/context_monitor.ts +147 -147
  25. package/dist/templates/_shared/hooks-ts/file-suggestion.ts +128 -128
  26. package/dist/templates/_shared/hooks-ts/pre_compact.ts +49 -49
  27. package/dist/templates/_shared/hooks-ts/session_end.ts +196 -196
  28. package/dist/templates/_shared/hooks-ts/session_start.ts +163 -163
  29. package/dist/templates/_shared/hooks-ts/task_create_capture.ts +48 -48
  30. package/dist/templates/_shared/hooks-ts/task_update_capture.ts +74 -74
  31. package/dist/templates/_shared/hooks-ts/user_prompt_submit.ts +93 -93
  32. package/dist/templates/_shared/lib-ts/CLAUDE.md +367 -367
  33. package/dist/templates/_shared/lib-ts/base/atomic-write.ts +138 -138
  34. package/dist/templates/_shared/lib-ts/base/constants.ts +24 -6
  35. package/dist/templates/_shared/lib-ts/base/git-state.ts +58 -58
  36. package/dist/templates/_shared/lib-ts/base/hook-utils.ts +582 -582
  37. package/dist/templates/_shared/lib-ts/base/inference.ts +301 -301
  38. package/dist/templates/_shared/lib-ts/base/logger.ts +247 -247
  39. package/dist/templates/_shared/lib-ts/base/state-io.ts +202 -202
  40. package/dist/templates/_shared/lib-ts/base/stop-words.ts +184 -184
  41. package/dist/templates/_shared/lib-ts/base/utils.ts +184 -184
  42. package/dist/templates/_shared/lib-ts/context/CLAUDE.md +134 -0
  43. package/dist/templates/_shared/lib-ts/context/context-formatter.ts +566 -566
  44. package/dist/templates/_shared/lib-ts/context/context-selector.ts +524 -524
  45. package/dist/templates/_shared/lib-ts/context/context-store.ts +712 -712
  46. package/dist/templates/_shared/lib-ts/context/plan-manager.ts +312 -312
  47. package/dist/templates/_shared/lib-ts/context/task-tracker.ts +185 -185
  48. package/dist/templates/_shared/lib-ts/package.json +20 -20
  49. package/dist/templates/_shared/lib-ts/templates/formatters.ts +102 -102
  50. package/dist/templates/_shared/lib-ts/templates/plan-context.ts +58 -58
  51. package/dist/templates/_shared/lib-ts/tsconfig.json +13 -13
  52. package/dist/templates/_shared/lib-ts/types.ts +186 -186
  53. package/dist/templates/_shared/scripts/resolve_context.ts +33 -33
  54. package/dist/templates/_shared/scripts/status_line.ts +687 -690
  55. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/ask.md +136 -136
  56. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/index.md +21 -21
  57. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/overview.md +56 -56
  58. package/dist/templates/cc-native/.claude/commands/cc-native/specdev.md +10 -10
  59. package/dist/templates/cc-native/.claude/settings.json +3 -2
  60. package/dist/templates/cc-native/.windsurf/workflows/cc-native/fix.md +8 -8
  61. package/dist/templates/cc-native/.windsurf/workflows/cc-native/implement.md +8 -8
  62. package/dist/templates/cc-native/.windsurf/workflows/cc-native/research.md +8 -8
  63. package/dist/templates/cc-native/CC-NATIVE-README.md +189 -189
  64. package/dist/templates/cc-native/TEMPLATE-SCHEMA.md +304 -304
  65. package/dist/templates/cc-native/_cc-native/agents/CLAUDE.md +143 -143
  66. package/dist/templates/cc-native/_cc-native/agents/PLAN-ORCHESTRATOR.md +213 -213
  67. package/dist/templates/cc-native/_cc-native/agents/plan-questions/PLAN-QUESTIONER.md +70 -70
  68. package/dist/templates/cc-native/_cc-native/artifacts/CLAUDE.md +64 -0
  69. package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/format.ts +1 -1
  70. package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/write.ts +2 -2
  71. package/dist/templates/cc-native/_cc-native/cc-native.config.json +96 -96
  72. package/dist/templates/cc-native/_cc-native/hooks/CLAUDE.md +14 -24
  73. package/dist/templates/cc-native/_cc-native/hooks/cc-native-plan-review.ts +1 -1
  74. package/dist/templates/cc-native/_cc-native/hooks/enhance_plan_post_subagent.ts +54 -54
  75. package/dist/templates/cc-native/_cc-native/hooks/enhance_plan_post_write.ts +51 -51
  76. package/dist/templates/cc-native/_cc-native/hooks/mark_questions_asked.ts +53 -53
  77. package/dist/templates/cc-native/_cc-native/hooks/plan_questions_early.ts +61 -61
  78. package/dist/templates/cc-native/_cc-native/hooks/validate_task_prompt.ts +76 -0
  79. package/dist/templates/cc-native/_cc-native/lib-ts/aggregate-agents.ts +9 -2
  80. package/dist/templates/cc-native/_cc-native/lib-ts/cc-native-state.ts +319 -319
  81. package/dist/templates/cc-native/_cc-native/lib-ts/cli-output-parser.ts +144 -144
  82. package/dist/templates/cc-native/_cc-native/lib-ts/config.ts +57 -57
  83. package/dist/templates/cc-native/_cc-native/lib-ts/constants.ts +83 -83
  84. package/dist/templates/cc-native/_cc-native/lib-ts/debug.ts +79 -79
  85. package/dist/templates/cc-native/_cc-native/lib-ts/index.ts +4 -4
  86. package/dist/templates/cc-native/_cc-native/lib-ts/json-parser.ts +168 -168
  87. package/dist/templates/cc-native/_cc-native/lib-ts/plan-discovery.ts +80 -80
  88. package/dist/templates/cc-native/_cc-native/lib-ts/plan-enhancement.ts +41 -41
  89. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/CLAUDE.md +480 -480
  90. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/embedding-indexer.ts +287 -287
  91. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/hyde.ts +148 -148
  92. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/index.ts +54 -54
  93. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/logger.ts +58 -58
  94. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/ollama-client.ts +208 -208
  95. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/retrieval-pipeline.ts +460 -460
  96. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-indexer.ts +446 -446
  97. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-loader.ts +280 -280
  98. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-searcher.ts +274 -274
  99. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/types.ts +201 -201
  100. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/vector-store.ts +278 -278
  101. package/dist/templates/cc-native/_cc-native/lib-ts/settings.ts +184 -184
  102. package/dist/templates/cc-native/_cc-native/lib-ts/state.ts +275 -275
  103. package/dist/templates/cc-native/_cc-native/lib-ts/tsconfig.json +18 -18
  104. package/dist/templates/cc-native/_cc-native/lib-ts/types.ts +1 -1
  105. package/dist/templates/cc-native/_cc-native/plan-review/CLAUDE.md +149 -0
  106. package/dist/templates/cc-native/_cc-native/plan-review/agents/CLAUDE.md +143 -0
  107. package/dist/templates/cc-native/_cc-native/plan-review/agents/PLAN-ORCHESTRATOR.md +213 -0
  108. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-questions/PLAN-QUESTIONER.md +70 -0
  109. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-EVOLUTION.md +62 -0
  110. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-PATTERNS.md +61 -0
  111. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-STRUCTURE.md +62 -0
  112. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ASSUMPTION-TRACER.md +56 -0
  113. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/CLARITY-AUDITOR.md +53 -0
  114. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-FEASIBILITY.md +66 -0
  115. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-GAPS.md +70 -0
  116. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-ORDERING.md +62 -0
  117. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/CONSTRAINT-VALIDATOR.md +72 -0
  118. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DESIGN-ADR-VALIDATOR.md +61 -0
  119. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DESIGN-SCALE-MATCHER.md +64 -0
  120. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DEVILS-ADVOCATE.md +56 -0
  121. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DOCUMENTATION-PHILOSOPHY.md +86 -0
  122. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/HANDOFF-READINESS.md +59 -0
  123. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/HIDDEN-COMPLEXITY.md +58 -0
  124. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/INCREMENTAL-DELIVERY.md +66 -0
  125. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-DEPENDENCY.md +62 -0
  126. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-FMEA.md +66 -0
  127. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-PREMORTEM.md +71 -0
  128. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-REVERSIBILITY.md +74 -0
  129. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SCOPE-BOUNDARY.md +77 -0
  130. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SIMPLICITY-GUARDIAN.md +62 -0
  131. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SKEPTIC.md +68 -0
  132. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-BEHAVIOR-AUDITOR.md +61 -0
  133. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-CHARACTERIZATION.md +71 -0
  134. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-FIRST-VALIDATOR.md +61 -0
  135. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-PYRAMID-ANALYZER.md +61 -0
  136. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TRADEOFF-COSTS.md +67 -0
  137. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TRADEOFF-STAKEHOLDERS.md +65 -0
  138. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/VERIFY-COVERAGE.md +74 -0
  139. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/VERIFY-STRENGTH.md +69 -0
  140. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/agent-selection.ts +3 -3
  141. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/corroboration.ts +1 -1
  142. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/graduation.ts +1 -1
  143. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/orchestrator.ts +2 -2
  144. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/output-builder.ts +3 -3
  145. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/plan-questions.ts +6 -6
  146. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/review-pipeline.ts +15 -15
  147. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/agent.ts +5 -5
  148. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/base/base-agent.ts +4 -4
  149. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/claude-agent.ts +4 -4
  150. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/codex-agent.ts +6 -6
  151. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/gemini-agent.ts +1 -1
  152. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/orchestrator-claude-agent.ts +4 -4
  153. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/types.ts +3 -3
  154. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/verdict.ts +1 -1
  155. package/oclif.manifest.json +1 -1
  156. package/package.json +108 -108
  157. package/dist/templates/cc-native/_cc-native/lib-ts/artifacts.ts +0 -21
  158. package/dist/templates/cc-native/_cc-native/lib-ts/nul +0 -3
  159. /package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/index.ts +0 -0
  160. /package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/tracker.ts +0 -0
  161. /package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/index.ts +0 -0
  162. /package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/schemas.ts +0 -0
  163. /package/dist/templates/cc-native/_cc-native/{workflows → plan-review/workflows}/specdev.md +0 -0
@@ -1,301 +1,301 @@
1
- /**
2
- * Inference utility for AI-powered text processing.
3
- * Unified interface for Claude API calls using the claude CLI.
4
- * See SPEC.md §6
5
- */
6
-
7
- import { execFileSync } from "node:child_process";
8
- import { logDebug, logWarn } from "./logger.js";
9
- import { STOP_WORDS } from "./stop-words.js";
10
- import type { InferenceResult } from "../types.js";
11
- import { execFileAsync, getInternalSubprocessEnv, shellQuoteWin } from "./subprocess-utils.js";
12
-
13
- // Model configurations §6.1
14
- const MODELS: Record<string, string> = {
15
- fast: "claude-3-haiku-20240307",
16
- standard: "claude-sonnet-4-20250514",
17
- smart: "claude-opus-4-20250514",
18
- };
19
-
20
- const TIMEOUTS: Record<string, number> = {
21
- fast: 15,
22
- standard: 30,
23
- smart: 90,
24
- };
25
-
26
- /**
27
- * Run inference using the claude CLI.
28
- * See SPEC.md §6.1
29
- */
30
- export function inference(
31
- systemPrompt: string,
32
- userPrompt: string,
33
- level = "fast",
34
- timeout?: number,
35
- ): InferenceResult {
36
- const startTime = Date.now();
37
- const model = MODELS[level] ?? MODELS.fast;
38
- const timeoutSec = timeout ?? TIMEOUTS[level] ?? TIMEOUTS.fast;
39
- const fullPrompt = `${systemPrompt}\n\n${userPrompt}`;
40
-
41
- // Remove ANTHROPIC_API_KEY to force subscription auth
42
- const env = { ...process.env };
43
- delete env.ANTHROPIC_API_KEY;
44
-
45
- try {
46
- const isWin = process.platform === "win32";
47
- let stdout: string;
48
-
49
- // On Windows with shell:true, Node.js sets windowsVerbatimArguments —
50
- // args are joined with spaces, NOT individually quoted. We must manually
51
- // wrap multi-word/special-char args in "..." for cmd.exe parsing.
52
- // Inside double quotes: "" = literal ", and |&<> are safe.
53
- const empty = isWin ? '""' : "";
54
- let promptArg = fullPrompt;
55
- if (isWin) {
56
- promptArg = '"' + fullPrompt.replace(/\r?\n/g, " ").replace(/"/g, '""') + '"';
57
- }
58
-
59
- stdout = execFileSync(
60
- "claude",
61
- ["--model", model, "--print", "--setting-sources", empty, "-p", "--no-session-persistence", promptArg],
62
- {
63
- timeout: timeoutSec * 1000,
64
- env,
65
- encoding: "utf-8",
66
- stdio: ["pipe", "pipe", "pipe"],
67
- shell: isWin, // Windows needs shell for .cmd resolution
68
- },
69
- );
70
-
71
- const latencyMs = Date.now() - startTime;
72
- return {
73
- success: true,
74
- output: stdout.trim(),
75
- latency_ms: latencyMs,
76
- };
77
- } catch (e: any) {
78
- const latencyMs = Date.now() - startTime;
79
-
80
- if (e.code === "ETIMEDOUT" || e.killed) {
81
- return {
82
- success: false,
83
- output: "",
84
- error: `Timeout after ${timeoutSec}s`,
85
- latency_ms: latencyMs,
86
- };
87
- }
88
-
89
- if (e.code === "ENOENT") {
90
- return {
91
- success: false,
92
- output: "",
93
- error: "claude CLI not found",
94
- latency_ms: latencyMs,
95
- };
96
- }
97
-
98
- // Non-zero exit code
99
- if (e.status !== undefined && e.status !== 0) {
100
- return {
101
- success: false,
102
- output: (e.stdout ?? "").toString().trim(),
103
- error: (e.stderr ?? "").toString().trim() || `Exit code: ${e.status}`,
104
- latency_ms: latencyMs,
105
- };
106
- }
107
-
108
- return {
109
- success: false,
110
- output: "",
111
- error: String(e),
112
- latency_ms: latencyMs,
113
- };
114
- }
115
- }
116
-
117
- // §6.2 — System prompt for keyword extraction
118
- const CONTEXT_ID_SYSTEM_PROMPT = `Extract 6-12 keywords from what the user wants to do.
119
-
120
- Rules:
121
- - Output 6-12 keywords only
122
- - Keywords: nouns, verbs, adjectives, technical terms, proper names
123
- - NO function words: the, to, with, for, in, a, an, of, on, is, it, and, or, that, this, be, as, at, by, from
124
- - Most important/specific words preferred
125
- - No punctuation, no quotes
126
-
127
- Output ONLY the keywords separated by spaces, nothing else.`;
128
-
129
- /**
130
- * Generate a keyword summary of a user prompt.
131
- * Uses Sonnet (standard tier). Returns null if inference fails.
132
- * See SPEC.md §6.2
133
- */
134
- export function generateSemanticSummary(
135
- prompt: string,
136
- timeout = 15,
137
- ): string | null {
138
- const result = inference(CONTEXT_ID_SYSTEM_PROMPT, prompt, "standard", timeout);
139
-
140
- if (!result.success || !result.output) return null;
141
-
142
- let summary = result.output.trim();
143
- summary = summary.replace(/^["']+|["']+$/g, "");
144
- summary = summary.replace(/[.!?]+$/, "");
145
-
146
- // Filter stop words
147
- summary = filterStopWords(summary);
148
-
149
- const words = summary.split(/\s+/);
150
- if (words.length < 6 || words.length > 12) return null;
151
-
152
- return summary;
153
- }
154
-
155
- // §6.3 — System prompt for context ID slug generation
156
- const CONTEXT_ID_SLUG_PROMPT = `You generate short title phrases for work sessions. These become folder names like \`260206-1959-fix-auth-middleware-redirect-loop-session-timeout\`.
157
-
158
- Users scan 100+ such names to find past sessions. Your title must make THIS session instantly recognizable.
159
-
160
- Rules:
161
- - Exactly 8-12 lowercase words
162
- - First word is an action verb (fix, add, implement, refactor, update, create, remove, optimize, debug, migrate, integrate, configure, deploy, scaffold, restructure)
163
- - Coherent phrase, not disjointed keywords — reads like a short task description
164
- - Prefer specific technical terms over generic words
165
- - No articles (the, a, an), no pronouns, no filler words, no punctuation, no quotes
166
- - Input may come from speech-to-text with filler words (uh, um, like, you know, basically, so) — ignore them entirely
167
-
168
- Examples:
169
-
170
- Input: "um so basically I need to like fix the auth bug in the login page"
171
- {"slug": "fix authentication bug login page redirect session handling flow"}
172
-
173
- Input: "hey uh can we add dark mode to the settings page"
174
- {"slug": "add dark mode toggle settings page user preference storage"}
175
-
176
- Input: "the context ids are bad can we change how we generate them towards a summary"
177
- {"slug": "improve context id generation use prompt summary slugs"}
178
-
179
- Input: "I want to refactor the database connection pooling for PostgreSQL"
180
- {"slug": "refactor postgresql database connection pooling optimize query performance"}
181
-
182
- Input: "so like you know the webhook retry logic is broken and stuff"
183
- {"slug": "fix webhook retry logic broken error handling recovery mechanism"}
184
-
185
- Input: "update the CI pipeline to cache node modules between runs"
186
- {"slug": "update ci pipeline cache node modules between workflow runs"}
187
-
188
- Respond with ONLY a JSON object: {"slug": "your 8-12 word phrase here"}`;
189
-
190
- /**
191
- * Generate a 5-12 word context ID slug from a user prompt.
192
- * Uses Haiku (fast tier) for low latency.
193
- * See SPEC.md §6.3
194
- */
195
- export function generateContextIdSlug(
196
- prompt: string,
197
- timeout = 3,
198
- ): string | null {
199
- const truncated = prompt.slice(0, 500);
200
-
201
- const result = inference(CONTEXT_ID_SLUG_PROMPT, truncated, "fast", timeout);
202
-
203
- if (!result.success || !result.output) {
204
- logWarn("inference", `Context ID slug inference failed: ${result.error}`);
205
- return null;
206
- }
207
-
208
- const raw = result.output.trim();
209
-
210
- // Parse JSON response, fall back to raw text
211
- let slug: string | null = null;
212
- try {
213
- const parsed = JSON.parse(raw);
214
- if (parsed && typeof parsed === "object" && "slug" in parsed) {
215
- slug = parsed.slug;
216
- }
217
- } catch {
218
- // Fall through to raw text
219
- }
220
-
221
- if (!slug) slug = raw;
222
-
223
- // Clean up
224
- slug = slug.replace(/^["'`]+|["'`]+$/g, "");
225
- slug = slug.replace(/[.!?]+$/, "");
226
- slug = slug.replace(/-/g, " ");
227
- slug = slug.replace(/[^a-zA-Z0-9 ]/g, "");
228
- slug = slug.replace(/\s+/g, " ").trim();
229
-
230
- const words = slug.split(" ");
231
-
232
- if (words.length > 12) words.length = 12;
233
- if (words.length < 5) {
234
- logDebug("inference", `Context ID slug too short (${words.length} words): '${slug}'`);
235
- return null;
236
- }
237
-
238
- const resultSlug = words.join(" ");
239
- logDebug("inference", `Generated context ID slug: '${resultSlug}' (${result.latency_ms}ms)`);
240
- return resultSlug;
241
- }
242
-
243
- /**
244
- * Async version of inference() that does NOT block the event loop.
245
- * Use for parallel AI calls (e.g., Stage 3 parallel summarizers).
246
- * Uses execFileAsync and getInternalSubprocessEnv for proper subprocess isolation.
247
- */
248
- export async function inferenceAsync(
249
- systemPrompt: string,
250
- userPrompt: string,
251
- level = "fast",
252
- timeout?: number,
253
- ): Promise<InferenceResult> {
254
- const startTime = Date.now();
255
- const model = (level in MODELS ? MODELS[level] : undefined) ?? MODELS.fast;
256
- const timeoutSec = timeout ?? (level in TIMEOUTS ? TIMEOUTS[level] : undefined) ?? TIMEOUTS.fast;
257
- const timeoutMs = timeoutSec * 1000;
258
- const fullPrompt = `${systemPrompt}\n\n${userPrompt}`;
259
-
260
- const env = getInternalSubprocessEnv();
261
- delete env.ANTHROPIC_API_KEY;
262
-
263
- const isWin = process.platform === "win32";
264
- const empty = isWin ? '""' : "";
265
- const promptArg = isWin
266
- ? shellQuoteWin(fullPrompt.replace(/\r?\n/g, " "))
267
- : fullPrompt;
268
-
269
- const result = await execFileAsync(
270
- "claude",
271
- ["--model", model, "--print", "--setting-sources", empty, "-p", "--no-session-persistence", promptArg],
272
- { timeout: timeoutMs, env, shell: isWin },
273
- );
274
-
275
- const latencyMs = Date.now() - startTime;
276
-
277
- if (result.killed) {
278
- return { success: false, output: "", error: `Timeout after ${timeoutSec}s`, latency_ms: latencyMs };
279
- }
280
- if (result.exitCode !== 0) {
281
- return {
282
- success: false,
283
- output: result.stdout.trim(),
284
- error: result.stderr.trim() || `Exit code: ${result.exitCode}`,
285
- latency_ms: latencyMs,
286
- };
287
- }
288
- return { success: true, output: result.stdout.trim(), latency_ms: latencyMs };
289
- }
290
-
291
- /**
292
- * Filter stop words from text.
293
- * See SPEC.md §6.4
294
- */
295
- function filterStopWords(text: string): string {
296
- return text
297
- .toLowerCase()
298
- .split(/\s+/)
299
- .filter((w) => !STOP_WORDS.has(w) && w.length > 1)
300
- .join(" ");
301
- }
1
+ /**
2
+ * Inference utility for AI-powered text processing.
3
+ * Unified interface for Claude API calls using the claude CLI.
4
+ * See SPEC.md §6
5
+ */
6
+
7
+ import { execFileSync } from "node:child_process";
8
+ import { logDebug, logWarn } from "./logger.js";
9
+ import { STOP_WORDS } from "./stop-words.js";
10
+ import type { InferenceResult } from "../types.js";
11
+ import { execFileAsync, getInternalSubprocessEnv, shellQuoteWin } from "./subprocess-utils.js";
12
+
13
+ // Model configurations §6.1
14
+ const MODELS: Record<string, string> = {
15
+ fast: "claude-haiku-4-5-20251001",
16
+ standard: "claude-sonnet-4-6",
17
+ smart: "claude-opus-4-6",
18
+ };
19
+
20
+ const TIMEOUTS: Record<string, number> = {
21
+ fast: 15,
22
+ standard: 30,
23
+ smart: 90,
24
+ };
25
+
26
+ /**
27
+ * Run inference using the claude CLI.
28
+ * See SPEC.md §6.1
29
+ */
30
+ export function inference(
31
+ systemPrompt: string,
32
+ userPrompt: string,
33
+ level = "fast",
34
+ timeout?: number,
35
+ ): InferenceResult {
36
+ const startTime = Date.now();
37
+ const model = MODELS[level] ?? MODELS.fast;
38
+ const timeoutSec = timeout ?? TIMEOUTS[level] ?? TIMEOUTS.fast;
39
+ const fullPrompt = `${systemPrompt}\n\n${userPrompt}`;
40
+
41
+ // Remove ANTHROPIC_API_KEY to force subscription auth
42
+ const env = { ...process.env };
43
+ delete env.ANTHROPIC_API_KEY;
44
+
45
+ try {
46
+ const isWin = process.platform === "win32";
47
+ let stdout: string;
48
+
49
+ // On Windows with shell:true, Node.js sets windowsVerbatimArguments —
50
+ // args are joined with spaces, NOT individually quoted. We must manually
51
+ // wrap multi-word/special-char args in "..." for cmd.exe parsing.
52
+ // Inside double quotes: "" = literal ", and |&<> are safe.
53
+ const empty = isWin ? '""' : "";
54
+ let promptArg = fullPrompt;
55
+ if (isWin) {
56
+ promptArg = '"' + fullPrompt.replace(/\r?\n/g, " ").replace(/"/g, '""') + '"';
57
+ }
58
+
59
+ stdout = execFileSync(
60
+ "claude",
61
+ ["--model", model, "--print", "--setting-sources", empty, "-p", "--no-session-persistence", promptArg],
62
+ {
63
+ timeout: timeoutSec * 1000,
64
+ env,
65
+ encoding: "utf-8",
66
+ stdio: ["pipe", "pipe", "pipe"],
67
+ shell: isWin, // Windows needs shell for .cmd resolution
68
+ },
69
+ );
70
+
71
+ const latencyMs = Date.now() - startTime;
72
+ return {
73
+ success: true,
74
+ output: stdout.trim(),
75
+ latency_ms: latencyMs,
76
+ };
77
+ } catch (e: any) {
78
+ const latencyMs = Date.now() - startTime;
79
+
80
+ if (e.code === "ETIMEDOUT" || e.killed) {
81
+ return {
82
+ success: false,
83
+ output: "",
84
+ error: `Timeout after ${timeoutSec}s`,
85
+ latency_ms: latencyMs,
86
+ };
87
+ }
88
+
89
+ if (e.code === "ENOENT") {
90
+ return {
91
+ success: false,
92
+ output: "",
93
+ error: "claude CLI not found",
94
+ latency_ms: latencyMs,
95
+ };
96
+ }
97
+
98
+ // Non-zero exit code
99
+ if (e.status !== undefined && e.status !== 0) {
100
+ return {
101
+ success: false,
102
+ output: (e.stdout ?? "").toString().trim(),
103
+ error: (e.stderr ?? "").toString().trim() || `Exit code: ${e.status}`,
104
+ latency_ms: latencyMs,
105
+ };
106
+ }
107
+
108
+ return {
109
+ success: false,
110
+ output: "",
111
+ error: String(e),
112
+ latency_ms: latencyMs,
113
+ };
114
+ }
115
+ }
116
+
117
+ // §6.2 — System prompt for keyword extraction
118
+ const CONTEXT_ID_SYSTEM_PROMPT = `Extract 6-12 keywords from what the user wants to do.
119
+
120
+ Rules:
121
+ - Output 6-12 keywords only
122
+ - Keywords: nouns, verbs, adjectives, technical terms, proper names
123
+ - NO function words: the, to, with, for, in, a, an, of, on, is, it, and, or, that, this, be, as, at, by, from
124
+ - Most important/specific words preferred
125
+ - No punctuation, no quotes
126
+
127
+ Output ONLY the keywords separated by spaces, nothing else.`;
128
+
129
+ /**
130
+ * Generate a keyword summary of a user prompt.
131
+ * Uses Sonnet (standard tier). Returns null if inference fails.
132
+ * See SPEC.md §6.2
133
+ */
134
+ export function generateSemanticSummary(
135
+ prompt: string,
136
+ timeout = 15,
137
+ ): string | null {
138
+ const result = inference(CONTEXT_ID_SYSTEM_PROMPT, prompt, "standard", timeout);
139
+
140
+ if (!result.success || !result.output) return null;
141
+
142
+ let summary = result.output.trim();
143
+ summary = summary.replace(/^["']+|["']+$/g, "");
144
+ summary = summary.replace(/[.!?]+$/, "");
145
+
146
+ // Filter stop words
147
+ summary = filterStopWords(summary);
148
+
149
+ const words = summary.split(/\s+/);
150
+ if (words.length < 6 || words.length > 12) return null;
151
+
152
+ return summary;
153
+ }
154
+
155
+ // §6.3 — System prompt for context ID slug generation
156
+ const CONTEXT_ID_SLUG_PROMPT = `You generate short title phrases for work sessions. These become folder names like \`260206-1959-fix-auth-middleware-redirect-loop-session-timeout\`.
157
+
158
+ Users scan 100+ such names to find past sessions. Your title must make THIS session instantly recognizable.
159
+
160
+ Rules:
161
+ - Exactly 8-12 lowercase words
162
+ - First word is an action verb (fix, add, implement, refactor, update, create, remove, optimize, debug, migrate, integrate, configure, deploy, scaffold, restructure)
163
+ - Coherent phrase, not disjointed keywords — reads like a short task description
164
+ - Prefer specific technical terms over generic words
165
+ - No articles (the, a, an), no pronouns, no filler words, no punctuation, no quotes
166
+ - Input may come from speech-to-text with filler words (uh, um, like, you know, basically, so) — ignore them entirely
167
+
168
+ Examples:
169
+
170
+ Input: "um so basically I need to like fix the auth bug in the login page"
171
+ {"slug": "fix authentication bug login page redirect session handling flow"}
172
+
173
+ Input: "hey uh can we add dark mode to the settings page"
174
+ {"slug": "add dark mode toggle settings page user preference storage"}
175
+
176
+ Input: "the context ids are bad can we change how we generate them towards a summary"
177
+ {"slug": "improve context id generation use prompt summary slugs"}
178
+
179
+ Input: "I want to refactor the database connection pooling for PostgreSQL"
180
+ {"slug": "refactor postgresql database connection pooling optimize query performance"}
181
+
182
+ Input: "so like you know the webhook retry logic is broken and stuff"
183
+ {"slug": "fix webhook retry logic broken error handling recovery mechanism"}
184
+
185
+ Input: "update the CI pipeline to cache node modules between runs"
186
+ {"slug": "update ci pipeline cache node modules between workflow runs"}
187
+
188
+ Respond with ONLY a JSON object: {"slug": "your 8-12 word phrase here"}`;
189
+
190
+ /**
191
+ * Generate a 5-12 word context ID slug from a user prompt.
192
+ * Uses Haiku (fast tier) for low latency.
193
+ * See SPEC.md §6.3
194
+ */
195
+ export function generateContextIdSlug(
196
+ prompt: string,
197
+ timeout = 3,
198
+ ): string | null {
199
+ const truncated = prompt.slice(0, 500);
200
+
201
+ const result = inference(CONTEXT_ID_SLUG_PROMPT, truncated, "fast", timeout);
202
+
203
+ if (!result.success || !result.output) {
204
+ logWarn("inference", `Context ID slug inference failed: ${result.error}`);
205
+ return null;
206
+ }
207
+
208
+ const raw = result.output.trim();
209
+
210
+ // Parse JSON response, fall back to raw text
211
+ let slug: string | null = null;
212
+ try {
213
+ const parsed = JSON.parse(raw);
214
+ if (parsed && typeof parsed === "object" && "slug" in parsed) {
215
+ slug = parsed.slug;
216
+ }
217
+ } catch {
218
+ // Fall through to raw text
219
+ }
220
+
221
+ if (!slug) slug = raw;
222
+
223
+ // Clean up
224
+ slug = slug.replace(/^["'`]+|["'`]+$/g, "");
225
+ slug = slug.replace(/[.!?]+$/, "");
226
+ slug = slug.replace(/-/g, " ");
227
+ slug = slug.replace(/[^a-zA-Z0-9 ]/g, "");
228
+ slug = slug.replace(/\s+/g, " ").trim();
229
+
230
+ const words = slug.split(" ");
231
+
232
+ if (words.length > 12) words.length = 12;
233
+ if (words.length < 5) {
234
+ logDebug("inference", `Context ID slug too short (${words.length} words): '${slug}'`);
235
+ return null;
236
+ }
237
+
238
+ const resultSlug = words.join(" ");
239
+ logDebug("inference", `Generated context ID slug: '${resultSlug}' (${result.latency_ms}ms)`);
240
+ return resultSlug;
241
+ }
242
+
243
+ /**
244
+ * Async version of inference() that does NOT block the event loop.
245
+ * Use for parallel AI calls (e.g., Stage 3 parallel summarizers).
246
+ * Uses execFileAsync and getInternalSubprocessEnv for proper subprocess isolation.
247
+ */
248
+ export async function inferenceAsync(
249
+ systemPrompt: string,
250
+ userPrompt: string,
251
+ level = "fast",
252
+ timeout?: number,
253
+ ): Promise<InferenceResult> {
254
+ const startTime = Date.now();
255
+ const model = (level in MODELS ? MODELS[level] : undefined) ?? MODELS.fast;
256
+ const timeoutSec = timeout ?? (level in TIMEOUTS ? TIMEOUTS[level] : undefined) ?? TIMEOUTS.fast;
257
+ const timeoutMs = timeoutSec * 1000;
258
+ const fullPrompt = `${systemPrompt}\n\n${userPrompt}`;
259
+
260
+ const env = getInternalSubprocessEnv();
261
+ delete env.ANTHROPIC_API_KEY;
262
+
263
+ const isWin = process.platform === "win32";
264
+ const empty = isWin ? '""' : "";
265
+ const promptArg = isWin
266
+ ? shellQuoteWin(fullPrompt.replace(/\r?\n/g, " "))
267
+ : fullPrompt;
268
+
269
+ const result = await execFileAsync(
270
+ "claude",
271
+ ["--model", model, "--print", "--setting-sources", empty, "-p", "--no-session-persistence", promptArg],
272
+ { timeout: timeoutMs, env, shell: isWin },
273
+ );
274
+
275
+ const latencyMs = Date.now() - startTime;
276
+
277
+ if (result.killed) {
278
+ return { success: false, output: "", error: `Timeout after ${timeoutSec}s`, latency_ms: latencyMs };
279
+ }
280
+ if (result.exitCode !== 0) {
281
+ return {
282
+ success: false,
283
+ output: result.stdout.trim(),
284
+ error: result.stderr.trim() || `Exit code: ${result.exitCode}`,
285
+ latency_ms: latencyMs,
286
+ };
287
+ }
288
+ return { success: true, output: result.stdout.trim(), latency_ms: latencyMs };
289
+ }
290
+
291
+ /**
292
+ * Filter stop words from text.
293
+ * See SPEC.md §6.4
294
+ */
295
+ function filterStopWords(text: string): string {
296
+ return text
297
+ .toLowerCase()
298
+ .split(/\s+/)
299
+ .filter((w) => !STOP_WORDS.has(w) && w.length > 1)
300
+ .join(" ");
301
+ }