aiwcli 0.12.6 → 0.12.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (163)
  1. package/bin/dev.cmd +3 -3
  2. package/bin/dev.js +16 -16
  3. package/bin/run.cmd +3 -3
  4. package/bin/run.js +21 -21
  5. package/dist/commands/branch.js +7 -2
  6. package/dist/lib/bmad-installer.js +37 -37
  7. package/dist/lib/terminal.d.ts +2 -0
  8. package/dist/lib/terminal.js +57 -7
  9. package/dist/templates/CLAUDE.md +232 -205
  10. package/dist/templates/_shared/.claude/settings.json +65 -65
  11. package/dist/templates/_shared/.claude/{commands/handoff.md → skills/handoff/SKILL.md} +13 -12
  12. package/dist/templates/_shared/.claude/{commands/handoff-resume.md → skills/handoff-resume/SKILL.md} +13 -12
  13. package/dist/templates/_shared/.codex/workflows/handoff.md +226 -226
  14. package/dist/templates/_shared/.windsurf/workflows/handoff.md +226 -226
  15. package/dist/templates/_shared/handoff-system/CLAUDE.md +15 -3
  16. package/dist/templates/_shared/handoff-system/lib/document-generator.ts +215 -215
  17. package/dist/templates/_shared/handoff-system/lib/handoff-reader.ts +158 -158
  18. package/dist/templates/_shared/handoff-system/scripts/resume_handoff.ts +373 -373
  19. package/dist/templates/_shared/handoff-system/scripts/save_handoff.ts +469 -469
  20. package/dist/templates/_shared/handoff-system/workflows/handoff-resume.md +66 -66
  21. package/dist/templates/_shared/handoff-system/workflows/handoff.md +254 -254
  22. package/dist/templates/_shared/hooks-ts/_utils/git-state.ts +2 -2
  23. package/dist/templates/_shared/hooks-ts/archive_plan.ts +159 -159
  24. package/dist/templates/_shared/hooks-ts/context_monitor.ts +147 -147
  25. package/dist/templates/_shared/hooks-ts/file-suggestion.ts +128 -128
  26. package/dist/templates/_shared/hooks-ts/pre_compact.ts +49 -49
  27. package/dist/templates/_shared/hooks-ts/session_end.ts +196 -196
  28. package/dist/templates/_shared/hooks-ts/session_start.ts +163 -163
  29. package/dist/templates/_shared/hooks-ts/task_create_capture.ts +48 -48
  30. package/dist/templates/_shared/hooks-ts/task_update_capture.ts +74 -74
  31. package/dist/templates/_shared/hooks-ts/user_prompt_submit.ts +93 -93
  32. package/dist/templates/_shared/lib-ts/CLAUDE.md +367 -367
  33. package/dist/templates/_shared/lib-ts/base/atomic-write.ts +138 -138
  34. package/dist/templates/_shared/lib-ts/base/constants.ts +24 -6
  35. package/dist/templates/_shared/lib-ts/base/git-state.ts +58 -58
  36. package/dist/templates/_shared/lib-ts/base/hook-utils.ts +582 -582
  37. package/dist/templates/_shared/lib-ts/base/inference.ts +301 -301
  38. package/dist/templates/_shared/lib-ts/base/logger.ts +247 -247
  39. package/dist/templates/_shared/lib-ts/base/state-io.ts +202 -202
  40. package/dist/templates/_shared/lib-ts/base/stop-words.ts +184 -184
  41. package/dist/templates/_shared/lib-ts/base/utils.ts +184 -184
  42. package/dist/templates/_shared/lib-ts/context/CLAUDE.md +134 -0
  43. package/dist/templates/_shared/lib-ts/context/context-formatter.ts +566 -566
  44. package/dist/templates/_shared/lib-ts/context/context-selector.ts +524 -524
  45. package/dist/templates/_shared/lib-ts/context/context-store.ts +712 -712
  46. package/dist/templates/_shared/lib-ts/context/plan-manager.ts +312 -312
  47. package/dist/templates/_shared/lib-ts/context/task-tracker.ts +185 -185
  48. package/dist/templates/_shared/lib-ts/package.json +20 -20
  49. package/dist/templates/_shared/lib-ts/templates/formatters.ts +102 -102
  50. package/dist/templates/_shared/lib-ts/templates/plan-context.ts +58 -58
  51. package/dist/templates/_shared/lib-ts/tsconfig.json +13 -13
  52. package/dist/templates/_shared/lib-ts/types.ts +186 -186
  53. package/dist/templates/_shared/scripts/resolve_context.ts +33 -33
  54. package/dist/templates/_shared/scripts/status_line.ts +687 -690
  55. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/ask.md +136 -136
  56. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/index.md +21 -21
  57. package/dist/templates/cc-native/.claude/commands/cc-native/rlm/overview.md +56 -56
  58. package/dist/templates/cc-native/.claude/commands/cc-native/specdev.md +10 -10
  59. package/dist/templates/cc-native/.claude/settings.json +3 -2
  60. package/dist/templates/cc-native/.windsurf/workflows/cc-native/fix.md +8 -8
  61. package/dist/templates/cc-native/.windsurf/workflows/cc-native/implement.md +8 -8
  62. package/dist/templates/cc-native/.windsurf/workflows/cc-native/research.md +8 -8
  63. package/dist/templates/cc-native/CC-NATIVE-README.md +189 -189
  64. package/dist/templates/cc-native/TEMPLATE-SCHEMA.md +304 -304
  65. package/dist/templates/cc-native/_cc-native/agents/CLAUDE.md +143 -143
  66. package/dist/templates/cc-native/_cc-native/agents/PLAN-ORCHESTRATOR.md +213 -213
  67. package/dist/templates/cc-native/_cc-native/agents/plan-questions/PLAN-QUESTIONER.md +70 -70
  68. package/dist/templates/cc-native/_cc-native/artifacts/CLAUDE.md +64 -0
  69. package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/format.ts +1 -1
  70. package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/write.ts +2 -2
  71. package/dist/templates/cc-native/_cc-native/cc-native.config.json +96 -96
  72. package/dist/templates/cc-native/_cc-native/hooks/CLAUDE.md +14 -24
  73. package/dist/templates/cc-native/_cc-native/hooks/cc-native-plan-review.ts +1 -1
  74. package/dist/templates/cc-native/_cc-native/hooks/enhance_plan_post_subagent.ts +54 -54
  75. package/dist/templates/cc-native/_cc-native/hooks/enhance_plan_post_write.ts +51 -51
  76. package/dist/templates/cc-native/_cc-native/hooks/mark_questions_asked.ts +53 -53
  77. package/dist/templates/cc-native/_cc-native/hooks/plan_questions_early.ts +61 -61
  78. package/dist/templates/cc-native/_cc-native/hooks/validate_task_prompt.ts +76 -0
  79. package/dist/templates/cc-native/_cc-native/lib-ts/aggregate-agents.ts +9 -2
  80. package/dist/templates/cc-native/_cc-native/lib-ts/cc-native-state.ts +319 -319
  81. package/dist/templates/cc-native/_cc-native/lib-ts/cli-output-parser.ts +144 -144
  82. package/dist/templates/cc-native/_cc-native/lib-ts/config.ts +57 -57
  83. package/dist/templates/cc-native/_cc-native/lib-ts/constants.ts +83 -83
  84. package/dist/templates/cc-native/_cc-native/lib-ts/debug.ts +79 -79
  85. package/dist/templates/cc-native/_cc-native/lib-ts/index.ts +4 -4
  86. package/dist/templates/cc-native/_cc-native/lib-ts/json-parser.ts +168 -168
  87. package/dist/templates/cc-native/_cc-native/lib-ts/plan-discovery.ts +80 -80
  88. package/dist/templates/cc-native/_cc-native/lib-ts/plan-enhancement.ts +41 -41
  89. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/CLAUDE.md +480 -480
  90. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/embedding-indexer.ts +287 -287
  91. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/hyde.ts +148 -148
  92. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/index.ts +54 -54
  93. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/logger.ts +58 -58
  94. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/ollama-client.ts +208 -208
  95. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/retrieval-pipeline.ts +460 -460
  96. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-indexer.ts +446 -446
  97. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-loader.ts +280 -280
  98. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/transcript-searcher.ts +274 -274
  99. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/types.ts +201 -201
  100. package/dist/templates/cc-native/_cc-native/lib-ts/rlm/vector-store.ts +278 -278
  101. package/dist/templates/cc-native/_cc-native/lib-ts/settings.ts +184 -184
  102. package/dist/templates/cc-native/_cc-native/lib-ts/state.ts +275 -275
  103. package/dist/templates/cc-native/_cc-native/lib-ts/tsconfig.json +18 -18
  104. package/dist/templates/cc-native/_cc-native/lib-ts/types.ts +1 -1
  105. package/dist/templates/cc-native/_cc-native/plan-review/CLAUDE.md +149 -0
  106. package/dist/templates/cc-native/_cc-native/plan-review/agents/CLAUDE.md +143 -0
  107. package/dist/templates/cc-native/_cc-native/plan-review/agents/PLAN-ORCHESTRATOR.md +213 -0
  108. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-questions/PLAN-QUESTIONER.md +70 -0
  109. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-EVOLUTION.md +62 -0
  110. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-PATTERNS.md +61 -0
  111. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ARCH-STRUCTURE.md +62 -0
  112. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/ASSUMPTION-TRACER.md +56 -0
  113. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/CLARITY-AUDITOR.md +53 -0
  114. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-FEASIBILITY.md +66 -0
  115. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-GAPS.md +70 -0
  116. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/COMPLETENESS-ORDERING.md +62 -0
  117. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/CONSTRAINT-VALIDATOR.md +72 -0
  118. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DESIGN-ADR-VALIDATOR.md +61 -0
  119. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DESIGN-SCALE-MATCHER.md +64 -0
  120. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DEVILS-ADVOCATE.md +56 -0
  121. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/DOCUMENTATION-PHILOSOPHY.md +86 -0
  122. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/HANDOFF-READINESS.md +59 -0
  123. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/HIDDEN-COMPLEXITY.md +58 -0
  124. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/INCREMENTAL-DELIVERY.md +66 -0
  125. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-DEPENDENCY.md +62 -0
  126. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-FMEA.md +66 -0
  127. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-PREMORTEM.md +71 -0
  128. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/RISK-REVERSIBILITY.md +74 -0
  129. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SCOPE-BOUNDARY.md +77 -0
  130. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SIMPLICITY-GUARDIAN.md +62 -0
  131. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/SKEPTIC.md +68 -0
  132. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-BEHAVIOR-AUDITOR.md +61 -0
  133. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-CHARACTERIZATION.md +71 -0
  134. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-FIRST-VALIDATOR.md +61 -0
  135. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TESTDRIVEN-PYRAMID-ANALYZER.md +61 -0
  136. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TRADEOFF-COSTS.md +67 -0
  137. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/TRADEOFF-STAKEHOLDERS.md +65 -0
  138. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/VERIFY-COVERAGE.md +74 -0
  139. package/dist/templates/cc-native/_cc-native/plan-review/agents/plan-review/VERIFY-STRENGTH.md +69 -0
  140. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/agent-selection.ts +3 -3
  141. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/corroboration.ts +1 -1
  142. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/graduation.ts +1 -1
  143. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/orchestrator.ts +2 -2
  144. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/output-builder.ts +3 -3
  145. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/plan-questions.ts +6 -6
  146. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/review-pipeline.ts +15 -15
  147. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/agent.ts +5 -5
  148. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/base/base-agent.ts +4 -4
  149. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/claude-agent.ts +4 -4
  150. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/codex-agent.ts +6 -6
  151. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/gemini-agent.ts +1 -1
  152. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/providers/orchestrator-claude-agent.ts +4 -4
  153. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/types.ts +3 -3
  154. package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/verdict.ts +1 -1
  155. package/oclif.manifest.json +1 -1
  156. package/package.json +108 -108
  157. package/dist/templates/cc-native/_cc-native/lib-ts/artifacts.ts +0 -21
  158. package/dist/templates/cc-native/_cc-native/lib-ts/nul +0 -3
  159. /package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/index.ts +0 -0
  160. /package/dist/templates/cc-native/_cc-native/{lib-ts/artifacts → artifacts/lib}/tracker.ts +0 -0
  161. /package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/index.ts +0 -0
  162. /package/dist/templates/cc-native/_cc-native/{lib-ts → plan-review/lib}/reviewers/schemas.ts +0 -0
  163. /package/dist/templates/cc-native/_cc-native/{workflows → plan-review/workflows}/specdev.md +0 -0
@@ -1,208 +1,208 @@
1
- /**
2
- * Ollama HTTP client for local embeddings.
3
- *
4
- * Uses nomic-embed-text via Ollama's /api/embed endpoint.
5
- * Zero API cost, fast, private.
6
- */
7
-
8
- import { z } from "zod";
9
- import {
10
- OLLAMA_BASE_URL,
11
- OLLAMA_EMBED_MODEL,
12
- EMBED_DIMENSIONS,
13
- HYDE_OLLAMA_MODEL,
14
- } from "./types.js";
15
- import { logDebug, logError } from "./logger.js";
16
-
17
- const HOOK_NAME = "rlm_ollama";
18
- const BATCH_SIZE = 32;
19
-
20
- // Zod schemas for runtime validation
21
- const OllamaTagsResponseSchema = z.object({
22
- models: z.array(z.object({ name: z.string() })).optional(),
23
- });
24
-
25
- const OllamaEmbedResponseSchema = z.object({
26
- embeddings: z.array(z.array(z.number())),
27
- });
28
-
29
- export interface OllamaConfig {
30
- baseUrl: string;
31
- model: string;
32
- dimensions: number;
33
- }
34
-
35
- const DEFAULT_CONFIG: OllamaConfig = {
36
- baseUrl: OLLAMA_BASE_URL,
37
- model: OLLAMA_EMBED_MODEL,
38
- dimensions: EMBED_DIMENSIONS,
39
- };
40
-
41
- export interface HealthResult {
42
- ok: boolean;
43
- error?: string;
44
- }
45
-
46
- /**
47
- * Check if Ollama is running and the embedding model is available.
48
- */
49
- export async function checkOllamaHealth(
50
- config: Partial<OllamaConfig> = {},
51
- ): Promise<HealthResult> {
52
- const cfg = { ...DEFAULT_CONFIG, ...config };
53
- try {
54
- const resp = await fetch(`${cfg.baseUrl}/api/tags`, {
55
- signal: AbortSignal.timeout(5_000),
56
- });
57
- if (!resp.ok) {
58
- return { ok: false, error: `Ollama responded with ${resp.status}` };
59
- }
60
- const json = await resp.json();
61
- const parseResult = OllamaTagsResponseSchema.safeParse(json);
62
- if (!parseResult.success) {
63
- return { ok: false, error: `Invalid Ollama API response: ${parseResult.error.message}` };
64
- }
65
- const models = parseResult.data.models ?? [];
66
- const found = models.some(
67
- (m) => m.name === cfg.model || m.name.startsWith(`${cfg.model}:`),
68
- );
69
- if (!found) {
70
- const available = models.map((m) => m.name).join(", ") || "none";
71
- return {
72
- ok: false,
73
- error: `Model "${cfg.model}" not found. Available: ${available}. Run: ollama pull ${cfg.model}`,
74
- };
75
- }
76
- return { ok: true };
77
- } catch (e: unknown) {
78
- const msg = e instanceof Error ? e.message : String(e);
79
- return {
80
- ok: false,
81
- error: `Cannot reach Ollama at ${cfg.baseUrl}: ${msg}. Is Ollama running?`,
82
- };
83
- }
84
- }
85
-
86
- /**
87
- * Embed multiple texts via Ollama /api/embed.
88
- * Batches at BATCH_SIZE (Ollama processes sequentially internally).
89
- * Returns one Float32Array per input text.
90
- */
91
- export async function embed(
92
- texts: string[],
93
- config: Partial<OllamaConfig> = {},
94
- ): Promise<Float32Array[]> {
95
- const cfg = { ...DEFAULT_CONFIG, ...config };
96
- const results: Float32Array[] = [];
97
-
98
- for (let i = 0; i < texts.length; i += BATCH_SIZE) {
99
- const batch = texts.slice(i, i + BATCH_SIZE);
100
- logDebug(HOOK_NAME, `Embedding batch ${i / BATCH_SIZE + 1} (${batch.length} texts)`);
101
-
102
- const resp = await fetch(`${cfg.baseUrl}/api/embed`, {
103
- method: "POST",
104
- headers: { "Content-Type": "application/json" },
105
- body: JSON.stringify({ model: cfg.model, input: batch }),
106
- signal: AbortSignal.timeout(30_000),
107
- });
108
-
109
- if (!resp.ok) {
110
- const body = await resp.text().catch(() => "");
111
- throw new Error(`Ollama embed failed (${resp.status}): ${body}`);
112
- }
113
-
114
- const json = await resp.json();
115
- const parseResult = OllamaEmbedResponseSchema.safeParse(json);
116
- if (!parseResult.success) {
117
- throw new Error(`Invalid Ollama embed response: ${parseResult.error.message}`);
118
- }
119
-
120
- const data = parseResult.data;
121
- if (data.embeddings.length !== batch.length) {
122
- throw new Error(
123
- `Expected ${batch.length} embeddings, got ${data.embeddings.length}`,
124
- );
125
- }
126
-
127
- for (const vec of data.embeddings) {
128
- results.push(new Float32Array(vec));
129
- }
130
- }
131
-
132
- return results;
133
- }
134
-
135
- /**
136
- * Embed a single text. Convenience wrapper around embed().
137
- */
138
- export async function embedOne(
139
- text: string,
140
- config: Partial<OllamaConfig> = {},
141
- ): Promise<Float32Array> {
142
- const results = await embed([text], config);
143
- if (results.length === 0) {
144
- throw new Error("Embedding failed: received empty result array");
145
- }
146
- return results[0];
147
- }
148
-
149
- /**
150
- * Generate text using Ollama's /api/generate endpoint.
151
- * Follows same pattern as embed()/embedOne() for consistency.
152
- */
153
- export async function generateText(
154
- prompt: string,
155
- options?: {
156
- systemPrompt?: string;
157
- temperature?: number;
158
- maxTokens?: number;
159
- timeout?: number;
160
- model?: string;
161
- },
162
- ): Promise<{ success: boolean; text: string; error?: string; latency_ms: number }> {
163
- const startTime = Date.now();
164
- const model = options?.model ?? HYDE_OLLAMA_MODEL;
165
- const baseUrl = process.env.OLLAMA_BASE_URL ?? OLLAMA_BASE_URL;
166
-
167
- try {
168
- const response = await fetch(`${baseUrl}/api/generate`, {
169
- method: "POST",
170
- headers: { "Content-Type": "application/json" },
171
- body: JSON.stringify({
172
- model,
173
- prompt: options?.systemPrompt
174
- ? `${options.systemPrompt}\n\n${prompt}`
175
- : prompt,
176
- stream: false, // Non-streaming for simplicity
177
- options: {
178
- temperature: options?.temperature ?? 0.7,
179
- num_predict: options?.maxTokens ?? 200,
180
- },
181
- }),
182
- signal: AbortSignal.timeout(options?.timeout ?? 10_000),
183
- });
184
-
185
- if (!response.ok) {
186
- return {
187
- success: false,
188
- text: "",
189
- error: `HTTP ${response.status}: ${response.statusText}`,
190
- latency_ms: Date.now() - startTime,
191
- };
192
- }
193
-
194
- const data = await response.json();
195
- return {
196
- success: true,
197
- text: data.response || "",
198
- latency_ms: Date.now() - startTime,
199
- };
200
- } catch (e) {
201
- return {
202
- success: false,
203
- text: "",
204
- error: String(e),
205
- latency_ms: Date.now() - startTime,
206
- };
207
- }
208
- }
1
+ /**
2
+ * Ollama HTTP client for local embeddings.
3
+ *
4
+ * Uses nomic-embed-text via Ollama's /api/embed endpoint.
5
+ * Zero API cost, fast, private.
6
+ */
7
+
8
+ import { z } from "zod";
9
+ import {
10
+ OLLAMA_BASE_URL,
11
+ OLLAMA_EMBED_MODEL,
12
+ EMBED_DIMENSIONS,
13
+ HYDE_OLLAMA_MODEL,
14
+ } from "./types.js";
15
+ import { logDebug, logError } from "./logger.js";
16
+
17
+ const HOOK_NAME = "rlm_ollama";
18
+ const BATCH_SIZE = 32;
19
+
20
+ // Zod schemas for runtime validation
21
+ const OllamaTagsResponseSchema = z.object({
22
+ models: z.array(z.object({ name: z.string() })).optional(),
23
+ });
24
+
25
+ const OllamaEmbedResponseSchema = z.object({
26
+ embeddings: z.array(z.array(z.number())),
27
+ });
28
+
29
+ export interface OllamaConfig {
30
+ baseUrl: string;
31
+ model: string;
32
+ dimensions: number;
33
+ }
34
+
35
+ const DEFAULT_CONFIG: OllamaConfig = {
36
+ baseUrl: OLLAMA_BASE_URL,
37
+ model: OLLAMA_EMBED_MODEL,
38
+ dimensions: EMBED_DIMENSIONS,
39
+ };
40
+
41
+ export interface HealthResult {
42
+ ok: boolean;
43
+ error?: string;
44
+ }
45
+
46
+ /**
47
+ * Check if Ollama is running and the embedding model is available.
48
+ */
49
+ export async function checkOllamaHealth(
50
+ config: Partial<OllamaConfig> = {},
51
+ ): Promise<HealthResult> {
52
+ const cfg = { ...DEFAULT_CONFIG, ...config };
53
+ try {
54
+ const resp = await fetch(`${cfg.baseUrl}/api/tags`, {
55
+ signal: AbortSignal.timeout(5_000),
56
+ });
57
+ if (!resp.ok) {
58
+ return { ok: false, error: `Ollama responded with ${resp.status}` };
59
+ }
60
+ const json = await resp.json();
61
+ const parseResult = OllamaTagsResponseSchema.safeParse(json);
62
+ if (!parseResult.success) {
63
+ return { ok: false, error: `Invalid Ollama API response: ${parseResult.error.message}` };
64
+ }
65
+ const models = parseResult.data.models ?? [];
66
+ const found = models.some(
67
+ (m) => m.name === cfg.model || m.name.startsWith(`${cfg.model}:`),
68
+ );
69
+ if (!found) {
70
+ const available = models.map((m) => m.name).join(", ") || "none";
71
+ return {
72
+ ok: false,
73
+ error: `Model "${cfg.model}" not found. Available: ${available}. Run: ollama pull ${cfg.model}`,
74
+ };
75
+ }
76
+ return { ok: true };
77
+ } catch (e: unknown) {
78
+ const msg = e instanceof Error ? e.message : String(e);
79
+ return {
80
+ ok: false,
81
+ error: `Cannot reach Ollama at ${cfg.baseUrl}: ${msg}. Is Ollama running?`,
82
+ };
83
+ }
84
+ }
85
+
86
+ /**
87
+ * Embed multiple texts via Ollama /api/embed.
88
+ * Batches at BATCH_SIZE (Ollama processes sequentially internally).
89
+ * Returns one Float32Array per input text.
90
+ */
91
+ export async function embed(
92
+ texts: string[],
93
+ config: Partial<OllamaConfig> = {},
94
+ ): Promise<Float32Array[]> {
95
+ const cfg = { ...DEFAULT_CONFIG, ...config };
96
+ const results: Float32Array[] = [];
97
+
98
+ for (let i = 0; i < texts.length; i += BATCH_SIZE) {
99
+ const batch = texts.slice(i, i + BATCH_SIZE);
100
+ logDebug(HOOK_NAME, `Embedding batch ${i / BATCH_SIZE + 1} (${batch.length} texts)`);
101
+
102
+ const resp = await fetch(`${cfg.baseUrl}/api/embed`, {
103
+ method: "POST",
104
+ headers: { "Content-Type": "application/json" },
105
+ body: JSON.stringify({ model: cfg.model, input: batch }),
106
+ signal: AbortSignal.timeout(30_000),
107
+ });
108
+
109
+ if (!resp.ok) {
110
+ const body = await resp.text().catch(() => "");
111
+ throw new Error(`Ollama embed failed (${resp.status}): ${body}`);
112
+ }
113
+
114
+ const json = await resp.json();
115
+ const parseResult = OllamaEmbedResponseSchema.safeParse(json);
116
+ if (!parseResult.success) {
117
+ throw new Error(`Invalid Ollama embed response: ${parseResult.error.message}`);
118
+ }
119
+
120
+ const data = parseResult.data;
121
+ if (data.embeddings.length !== batch.length) {
122
+ throw new Error(
123
+ `Expected ${batch.length} embeddings, got ${data.embeddings.length}`,
124
+ );
125
+ }
126
+
127
+ for (const vec of data.embeddings) {
128
+ results.push(new Float32Array(vec));
129
+ }
130
+ }
131
+
132
+ return results;
133
+ }
134
+
135
+ /**
136
+ * Embed a single text. Convenience wrapper around embed().
137
+ */
138
+ export async function embedOne(
139
+ text: string,
140
+ config: Partial<OllamaConfig> = {},
141
+ ): Promise<Float32Array> {
142
+ const results = await embed([text], config);
143
+ if (results.length === 0) {
144
+ throw new Error("Embedding failed: received empty result array");
145
+ }
146
+ return results[0];
147
+ }
148
+
149
+ /**
150
+ * Generate text using Ollama's /api/generate endpoint.
151
+ * Follows same pattern as embed()/embedOne() for consistency.
152
+ */
153
+ export async function generateText(
154
+ prompt: string,
155
+ options?: {
156
+ systemPrompt?: string;
157
+ temperature?: number;
158
+ maxTokens?: number;
159
+ timeout?: number;
160
+ model?: string;
161
+ },
162
+ ): Promise<{ success: boolean; text: string; error?: string; latency_ms: number }> {
163
+ const startTime = Date.now();
164
+ const model = options?.model ?? HYDE_OLLAMA_MODEL;
165
+ const baseUrl = process.env.OLLAMA_BASE_URL ?? OLLAMA_BASE_URL;
166
+
167
+ try {
168
+ const response = await fetch(`${baseUrl}/api/generate`, {
169
+ method: "POST",
170
+ headers: { "Content-Type": "application/json" },
171
+ body: JSON.stringify({
172
+ model,
173
+ prompt: options?.systemPrompt
174
+ ? `${options.systemPrompt}\n\n${prompt}`
175
+ : prompt,
176
+ stream: false, // Non-streaming for simplicity
177
+ options: {
178
+ temperature: options?.temperature ?? 0.7,
179
+ num_predict: options?.maxTokens ?? 200,
180
+ },
181
+ }),
182
+ signal: AbortSignal.timeout(options?.timeout ?? 10_000),
183
+ });
184
+
185
+ if (!response.ok) {
186
+ return {
187
+ success: false,
188
+ text: "",
189
+ error: `HTTP ${response.status}: ${response.statusText}`,
190
+ latency_ms: Date.now() - startTime,
191
+ };
192
+ }
193
+
194
+ const data = await response.json();
195
+ return {
196
+ success: true,
197
+ text: data.response || "",
198
+ latency_ms: Date.now() - startTime,
199
+ };
200
+ } catch (e) {
201
+ return {
202
+ success: false,
203
+ text: "",
204
+ error: String(e),
205
+ latency_ms: Date.now() - startTime,
206
+ };
207
+ }
208
+ }