@badliveware/pi-model-catalog 0.1.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/CHANGELOG.md ADDED
@@ -0,0 +1,11 @@
1
+ # Changelog
2
+
3
+ ## 0.2.0
4
+
5
+ - Expose per-model supported Pi thinking levels in `list_pi_models` output and details.
6
+ - Shorten repeated `list_pi_models` output caveats and keep detailed interpretation guidance in the tool prompt guidelines.
7
+ - Update package imports and peer dependencies for the `@earendil-works/*` Pi packages.
8
+
9
+ ## 0.1.1
10
+
11
+ - Initial public package release for Pi model catalog inspection.
package/README.md CHANGED
@@ -2,7 +2,7 @@
2
2
 
3
3
  Adds a `list_pi_models` tool that lets agents inspect Pi's current model registry before choosing or recommending a model.
4
4
 
5
- Use it when model choice should depend on what is actually available in your Pi setup: auth status, local support notes, enabled/cycling preferences, context size, capabilities, quota guidance, and optional price data.
5
+ Use it when model choice should depend on what is actually available in your Pi setup: auth status, local support notes, enabled/cycling preferences, context size, capabilities, supported thinking levels, quota guidance, and optional price data.
6
6
 
7
7
  ## Install
8
8
 
@@ -39,10 +39,11 @@ Default output is intentionally compact:
39
39
  - `auth`, `support`, and `enabled` status
40
40
  - context and max output tokens
41
41
  - capability marker: `text`, `think`, `img`, or `think+img`
42
+ - supported Pi thinking levels, shown as `off`, `min`, `low`, `med`, `high`, and `xhi` in the compact table
42
43
  - price tier and rough relative cost
43
44
  - quota/scarcity guidance
44
45
 
45
- Pass `includeDetails: true` for verbose use/avoid guidance. Pass `includePricing: true` for numeric input/output prices and relative ratios.
46
+ Pass `includeDetails: true` for verbose use/avoid guidance and full thinking level names. Pass `includePricing: true` for numeric input/output prices and relative ratios. Structured tool details include `thinkingLevels` and any model-specific `thinkingLevelMap`; Pi uses `off` for provider no/none thinking.
46
47
 
47
48
  ## Tool parameters
48
49
 
package/catalog.ts ADDED
@@ -0,0 +1,447 @@
1
+ import * as fs from "node:fs";
2
+ import * as os from "node:os";
3
+ import * as path from "node:path";
4
+ import { getSupportedThinkingLevels, type Api, type Model } from "@earendil-works/pi-ai";
5
+ import type { ExtensionContext } from "@earendil-works/pi-coding-agent";
6
+
7
/** Selects whether locally-unsupported models are dropped, kept, or shown exclusively. */
export type UnsupportedMode = "exclude" | "include" | "only";

/** Options understood by the model listing; every field is optional. */
export interface ListPiModelsParams {
  /** Free-text filter matched against provider, model id and model name. */
  query?: string;
  /** When true, list every registered model instead of only the available ones. */
  includeUnavailable?: boolean;
  /** When true, append the per-model usage guidance section. */
  includeDetails?: boolean;
  /** When true, add numeric price and ratio columns. */
  includePricing?: boolean;
  /** Model id (`provider/id` or bare id) used as the baseline for relative prices. */
  relativeTo?: string;
  /** How locally-unsupported models are treated. */
  unsupported?: UnsupportedMode;
}

/** Subset of the agent's `settings.json` read by this module. */
interface ModelCatalogSettings {
  enabledModels?: string[];
}

/** One `unsupportedModels` entry: either an id string or an object naming the model. */
type UnsupportedModelEntry = string | { model?: string; fullId?: string; reason?: string };

/** Shape of the optional `model-catalog.json` file. */
interface ModelCatalogConfig {
  unsupportedModels?: UnsupportedModelEntry[];
}

/** Why a model was marked unsupported. */
interface UnsupportedModelInfo {
  reason: string;
}

/** Prices copied from the model's `cost` plus optional ratios against a baseline model. */
interface ModelPricing {
  inputPerMillion: number;
  outputPerMillion: number;
  cacheReadPerMillion: number;
  cacheWritePerMillion: number;
  /** False when the registry carries no usable price for the model. */
  known: boolean;
  /** `provider/id` of the baseline the `relative*` fields were computed against. */
  relativeTo?: string;
  relativeInput?: number;
  relativeOutput?: number;
  relativeCacheRead?: number;
  /** Ratio of (input + output) price against the baseline's (input + output) price. */
  relativeBlended?: number;
}

/** One model as presented in the catalog table and structured details. */
interface ModelCatalogRow {
  provider: string;
  model: string;
  /** `provider/model`. */
  fullId: string;
  /** True for the model currently selected in the extension context. */
  current: boolean;
  available: boolean;
  cycleEnabled: boolean;
  /** Context window, already formatted for display. */
  context: string;
  /** Maximum output tokens, already formatted for display. */
  maxOut: string;
  /** "yes" or "no". */
  thinking: string;
  thinkingLevels: string[];
  thinkingLevelMap?: Partial<Record<string, string | null>>;
  /** "yes" or "no". */
  images: string;
  cost: string;
  quota: string;
  pricing: ModelPricing;
  supported: boolean;
  unsupportedReason?: string;
  useFor: string;
  avoidFor: string;
}

/** Output of `toRows`: the rows to display plus bookkeeping for footer notes. */
interface ModelCatalogResult {
  rows: ModelCatalogRow[];
  /** Every matching row that is marked unsupported, regardless of the selected mode. */
  excludedUnsupportedRows: ModelCatalogRow[];
  pricingBaseline?: string;
  pricingBaselineMissing?: string;
}
71
+
72
/**
 * Resolves the directory that holds the Pi agent's configuration files.
 *
 * `PI_CODING_AGENT_DIR` takes precedence over `PI_AGENT_DIR`; when neither
 * variable is set the result is `<home>/.pi/agent`.
 */
function agentDir(): string {
  const override = process.env.PI_CODING_AGENT_DIR ?? process.env.PI_AGENT_DIR;
  if (override !== undefined && override !== null) {
    return override;
  }
  return path.join(os.homedir(), ".pi", "agent");
}
75
+
76
/**
 * Loads `settings.json` from the agent directory.
 *
 * Best effort: a missing file, unreadable file, invalid JSON, or a JSON value
 * that is not an object all yield an empty settings object.
 */
function readSettings(): ModelCatalogSettings {
  let decoded: unknown;
  try {
    const file = path.join(agentDir(), "settings.json");
    decoded = JSON.parse(fs.readFileSync(file, "utf-8"));
  } catch {
    return {};
  }
  if (decoded === null || typeof decoded !== "object") {
    return {};
  }
  return decoded as ModelCatalogSettings;
}
85
+
86
/**
 * Loads `model-catalog.json` from the agent directory.
 *
 * Best effort: any read or parse failure, or a JSON value that is not an
 * object, yields an empty config.
 */
function readModelCatalogConfig(): ModelCatalogConfig {
  const emptyConfig: ModelCatalogConfig = {};
  try {
    const text = fs.readFileSync(path.join(agentDir(), "model-catalog.json"), "utf-8");
    const decoded: unknown = JSON.parse(text);
    const isObject = Boolean(decoded) && typeof decoded === "object";
    return isObject ? (decoded as ModelCatalogConfig) : emptyConfig;
  } catch {
    return emptyConfig;
  }
}
95
+
96
/**
 * Formats a token count compactly: `512`, `128K`, `128.5K`, `1M`, `1.5M`.
 *
 * Whole multiples of the unit print without a fraction; everything else is
 * rounded to one decimal place.
 *
 * @param count Number of tokens.
 * @returns The count with a `K` or `M` suffix, or the plain number below 1,000.
 */
function formatTokenCount(count: number): string {
  const withUnit = (scaled: number, unit: string): string =>
    scaled % 1 === 0 ? `${scaled}${unit}` : `${scaled.toFixed(1)}${unit}`;

  if (count >= 1_000_000) {
    return withUnit(count / 1_000_000, "M");
  }
  if (count >= 1_000) {
    const thousands = count / 1_000;
    // Counts just below one million (e.g. 999_999) round up to "1000.0K";
    // print those in millions so the unit matches the rounded value.
    if (Number(thousands.toFixed(1)) >= 1_000) {
      return withUnit(count / 1_000_000, "M");
    }
    return withUnit(thousands, "K");
  }
  return count.toString();
}
107
+
108
/**
 * Formats a dollars-per-million-tokens price for display.
 *
 * @param value Price in dollars per million tokens.
 * @param known Whether the price is actually known; unknown prices render as an em dash.
 * @returns `$0` for exactly zero, three decimals below one dollar, two decimals otherwise.
 */
function formatPricePerMillion(value: number, known: boolean): string {
  if (!known) {
    return "—";
  }
  if (value === 0) {
    return "$0";
  }
  const decimals = value < 1 ? 3 : 2;
  return "$" + value.toFixed(decimals);
}
113
+
114
/**
 * Formats a relative-cost ratio as `1.50×`.
 *
 * @param value Ratio to format; `undefined`, `NaN` and infinities render as an em dash.
 */
function formatRatio(value: number | undefined): string {
  const printable = value !== undefined && Number.isFinite(value);
  return printable ? `${(value as number).toFixed(2)}×` : "—";
}
118
+
119
/**
 * Builds the compact capability marker for a row: `think`, `img`,
 * `think+img`, or `text` when the row has neither capability.
 */
function formatCapabilities(row: ModelCatalogRow): string {
  const markers = [
    row.thinking === "yes" ? "think" : "",
    row.images === "yes" ? "img" : "",
  ].filter((marker) => marker !== "");
  if (markers.length === 0) {
    return "text";
  }
  return markers.join("+");
}
125
+
126
/**
 * Abbreviations used for thinking levels in the compact table.
 * A `Map` is used so that level names which happen to collide with
 * `Object.prototype` members (e.g. `constructor`) are not "found".
 */
const THINKING_LEVEL_LABELS: ReadonlyMap<string, string> = new Map([
  ["off", "off"],
  ["minimal", "min"],
  ["low", "low"],
  ["medium", "med"],
  ["high", "high"],
  ["xhigh", "xhi"],
]);

/**
 * Renders thinking levels as a comma-separated list of abbreviations.
 *
 * @param levels Thinking level names in display order.
 * @returns Abbreviated levels joined with `,`; names without an abbreviation
 *   pass through unchanged, and an empty list renders as an em dash.
 */
function formatThinkingLevels(levels: string[]): string {
  const rendered = levels.map((level) => THINKING_LEVEL_LABELS.get(level) ?? level).join(",");
  return rendered || "—";
}
137
+
138
/**
 * Splits a command-argument string into words using shell-like quoting.
 *
 * - Unquoted whitespace separates words.
 * - Single or double quotes group text (the quote characters are removed).
 * - A backslash takes the next character literally, except inside single
 *   quotes where the backslash itself is literal.
 * - An unterminated quote keeps the remaining text as part of the last word;
 *   a trailing lone backslash is dropped; empty quoted strings produce no word.
 */
function shellWords(input: string): string[] {
  const words: string[] = [];
  let current = "";
  let quote: '"' | "'" | undefined;
  let escaping = false;
  for (const char of input) {
    if (escaping) {
      current += char;
      escaping = false;
      continue;
    }
    if (char === "\\" && quote !== "'") {
      escaping = true;
      continue;
    }
    if ((char === '"' || char === "'") && (!quote || quote === char)) {
      // Opens a quote when none is active, closes it when it matches.
      quote = quote ? undefined : char;
      continue;
    }
    if (!quote && /\s/.test(char)) {
      if (current) words.push(current);
      current = "";
      continue;
    }
    current += char;
  }
  if (current) words.push(current);
  return words;
}

const MODELS_GUIDE_DETAIL_FLAGS: ReadonlySet<string> = new Set(["--verbose", "--details", "-v"]);
const MODELS_GUIDE_PRICING_FLAGS: ReadonlySet<string> = new Set(["--pricing", "--prices", "-p"]);
const MODELS_GUIDE_BASELINE_FLAGS: ReadonlySet<string> = new Set(["--relative-to", "--relative", "--baseline"]);
const MODELS_GUIDE_INLINE_BASELINE = /^--(?:relative-to|relative|baseline)=(.*)$/;

/** True when `word` is one of the options this parser recognizes. */
function isModelsGuideOption(word: string): boolean {
  return (
    MODELS_GUIDE_DETAIL_FLAGS.has(word) ||
    MODELS_GUIDE_PRICING_FLAGS.has(word) ||
    MODELS_GUIDE_BASELINE_FLAGS.has(word) ||
    MODELS_GUIDE_INLINE_BASELINE.test(word)
  );
}

/**
 * Parses the argument string of the models-guide command.
 *
 * Recognized options:
 * - `--verbose` / `--details` / `-v` set `includeDetails`.
 * - `--pricing` / `--prices` / `-p` set `includePricing`.
 * - `--relative-to X`, `--relative X`, `--baseline X` (or the `--flag=X`
 *   form) set `relativeTo`.
 *
 * Every other word becomes part of the free-text `query` (joined with single
 * spaces; `undefined` when there are none).
 *
 * A baseline flag only consumes the following word when that word is not
 * itself a recognized option, so `--baseline --pricing` still enables pricing.
 * A baseline flag without a value (including `--baseline=`) leaves
 * `relativeTo` undefined rather than polluting the query.
 *
 * @param args Raw argument text as typed by the user.
 */
export function parseModelsGuideArgs(args: string): Pick<ListPiModelsParams, "query" | "includeDetails" | "includePricing" | "relativeTo"> {
  const queryParts: string[] = [];
  let includeDetails = false;
  let includePricing = false;
  let relativeTo: string | undefined;
  const words = shellWords(args);
  for (let index = 0; index < words.length; index += 1) {
    const word = words[index];
    if (MODELS_GUIDE_DETAIL_FLAGS.has(word)) {
      includeDetails = true;
      continue;
    }
    if (MODELS_GUIDE_PRICING_FLAGS.has(word)) {
      includePricing = true;
      continue;
    }
    if (MODELS_GUIDE_BASELINE_FLAGS.has(word)) {
      const next: string | undefined = words[index + 1];
      if (next !== undefined && !isModelsGuideOption(next)) {
        relativeTo = next;
        index += 1;
      } else {
        // No value supplied: do not swallow the following option.
        relativeTo = undefined;
      }
      continue;
    }
    const inline = MODELS_GUIDE_INLINE_BASELINE.exec(word);
    if (inline) {
      relativeTo = inline[1] || undefined;
      continue;
    }
    queryParts.push(word);
  }
  return {
    query: queryParts.join(" ") || undefined,
    includeDetails,
    includePricing,
    relativeTo,
  };
}
203
+
204
/**
 * Case-insensitive substring filter over a model's provider, id and name.
 *
 * @param model Model to test.
 * @param query Search text; `undefined`, empty or whitespace-only matches every model.
 * @returns True when the trimmed query occurs in `"<provider> <id> <name>"`.
 */
function matchesModel(model: Model<Api>, query: string | undefined): boolean {
  const needle = query?.trim().toLowerCase();
  if (!needle) {
    return true;
  }
  const haystack = `${model.provider} ${model.id} ${model.name}`.toLowerCase();
  return haystack.includes(needle);
}
209
+
210
/**
 * Detects "spark" models by id: the lower-cased id must contain `spark` as a
 * whole segment delimited by `-`, `_`, or the start/end of the id.
 */
function isSparkModel(model: Model<Api>): boolean {
  const normalizedId = model.id.toLowerCase();
  const sparkSegment = /(?:^|[-_])spark(?:$|[-_])/;
  return sparkSegment.test(normalizedId);
}
213
+
214
/**
 * Detects locally-hosted models from the provider name: the lower-cased
 * provider either starts with `local-` or contains `llamaswap`.
 */
function isLocalModel(model: Model<Api>): boolean {
  const providerName = String(model.provider).toLowerCase();
  if (providerName.startsWith("local-")) {
    return true;
  }
  return providerName.includes("llamaswap");
}
218
+
219
/**
 * Assigns a coarse price tier to a model.
 *
 * Local models are `free/local` and spark models are `premium-speed`
 * regardless of listed prices. Otherwise the tier comes from the sum of the
 * input and output prices (missing values count as 0): `unknown/sub` for a
 * non-positive sum, then `low` (≤ 1), `medium` (≤ 8), `high` (≤ 30), and
 * `premium` above that.
 */
function classifyCost(model: Model<Api>): string {
  if (isLocalModel(model)) return "free/local";
  if (isSparkModel(model)) return "premium-speed";

  const rates = model.cost;
  const blended = (rates?.input ?? 0) + (rates?.output ?? 0);
  if (blended <= 0) return "unknown/sub";

  // Ascending upper bounds; the first bound that contains the sum wins.
  const tiers: Array<[number, string]> = [
    [1, "low"],
    [8, "medium"],
    [30, "high"],
  ];
  for (const [upperBound, tier] of tiers) {
    if (blended <= upperBound) return tier;
  }
  return "premium";
}
232
+
233
/**
 * Assigns a quota/scarcity label to a model from its provider and id.
 *
 * Rules are checked in order and the first hit wins:
 * 1. local provider → `local-serial`
 * 2. spark model → `very-fast`
 * 3. id contains a small-model marker (`mini`, `flash`, `lite`, `haiku`,
 *    `small`) → `fast/limited`
 * 4. id contains a flagship marker (`opus`, `pro`, `gpt-5.5`, `o3`, `sonnet`,
 *    `grok-4`) → `scarce`
 * 5. provider contains `codex` or `copilot` → `subscription`
 * 6. otherwise → `standard`
 *
 * Small-model markers must not be embedded in a longer alphabetic word, so
 * the `mini` inside `gemini` does not count and `gemini-…-pro` reaches the
 * flagship rule.
 */
function classifyQuota(model: Model<Api>): string {
  const id = model.id.toLowerCase();
  const provider = String(model.provider).toLowerCase();
  if (isLocalModel(model)) return "local-serial";
  if (isSparkModel(model)) return "very-fast";
  // Letter boundaries on both sides: "gpt-5-mini" matches, "gemini"/"minimax" do not.
  if (/(?<![a-z])(?:mini|flash|lite|haiku|small)(?![a-z])/.test(id)) return "fast/limited";
  if (/opus|pro|gpt-5\.5|o3|sonnet|grok-4/.test(id)) return "scarce";
  if (provider.includes("codex") || provider.includes("copilot")) return "subscription";
  return "standard";
}
243
+
244
/**
 * Buckets a model into a usage profile from its provider and id.
 *
 * Rules are checked in order and the first hit wins:
 * 1. local provider → `local`
 * 2. spark model → `latency`
 * 3. id contains a small-model marker (`mini`, `flash`, `lite`, `haiku`,
 *    `small`) → `fast`
 * 4. id contains a flagship marker (`opus`, `pro`, `gpt-5.5`, `gpt-5.4` not
 *    followed by `-mini`, `o3`, `sonnet`, `grok-4`) → `strong`
 * 5. otherwise → `standard`
 *
 * Small-model markers must not be embedded in a longer alphabetic word, so
 * the `mini` inside `gemini` does not count and `gemini-…-pro` is profiled
 * as `strong` rather than `fast`.
 */
function modelProfile(model: Model<Api>): "local" | "latency" | "fast" | "standard" | "strong" {
  const id = model.id.toLowerCase();
  if (isLocalModel(model)) return "local";
  if (isSparkModel(model)) return "latency";
  // Letter boundaries on both sides: "gpt-5-mini" matches, "gemini"/"minimax" do not.
  if (/(?<![a-z])(?:mini|flash|lite|haiku|small)(?![a-z])/.test(id)) return "fast";
  if (/opus|pro|gpt-5\.5|gpt-5\.4(?!-mini)|o3|sonnet|grok-4/.test(id)) return "strong";
  return "standard";
}
252
+
253
/**
 * Returns the "use for" / "avoid for" guidance text for a model, chosen
 * solely by the profile that `modelProfile` assigns to it.
 */
function usageGuidance(model: Model<Api>): Pick<ModelCatalogRow, "useFor" | "avoidFor"> {
  switch (modelProfile(model)) {
    case "local":
      return {
        useFor: "local background work when latency is acceptable, concurrency is low, and the configured model's capability is sufficient",
        avoidFor: "interactive work, latency-sensitive tasks, tasks above the configured local model's capability, final review, or parallel/concurrent local-model tasks unless explicitly chosen",
      };
    case "latency":
      return {
        useFor: "latency-critical bounded tasks and quick scouts when very high speed is worth premium cost",
        avoidFor: "cheap routine delegation, bulk mechanical work, cost-sensitive tasks, risky architecture, final review",
      };
    case "fast":
      return {
        useFor: "routine edits, search, summaries, tests, bounded subagent tasks when low cost or lower scarcity matters",
        avoidFor: "risky architecture, subtle debugging, final review of high-impact changes",
      };
    case "strong":
      return {
        useFor: "hard reasoning, risky refactors, architecture, adversarial review",
        avoidFor: "mechanical searches or easy-to-verify chores when faster models suffice",
      };
    default:
      // "standard" and anything unrecognized share the general-purpose guidance.
      return {
        useFor: "default implementation, debugging, review, moderate planning",
        avoidFor: "very mechanical chores if a faster model is available; highest-risk work if a stronger model is available",
      };
  }
}
284
+
285
/**
 * Builds the lookup of models marked unsupported in `model-catalog.json`.
 *
 * Each `unsupportedModels` entry is either a string id or an object whose id
 * is `fullId` (falling back to `model` when `fullId` is absent) with an
 * optional `reason`. Entries without a reason get a default one.
 *
 * The file is user-edited, so malformed content is skipped instead of
 * throwing: a non-array `unsupportedModels`, `null` or non-object entries,
 * and entries whose id is missing, empty or not a string are ignored.
 *
 * @returns Map from the configured id to the reason it is unsupported.
 */
function unsupportedModels(): Map<string, UnsupportedModelInfo> {
  const defaultReason = "marked unsupported in model-catalog.json";
  const unsupported = new Map<string, UnsupportedModelInfo>();
  const configured: unknown = readModelCatalogConfig().unsupportedModels;
  if (!Array.isArray(configured)) return unsupported;

  for (const entry of configured as unknown[]) {
    if (typeof entry === "string") {
      unsupported.set(entry, { reason: defaultReason });
      continue;
    }
    if (entry === null || typeof entry !== "object") continue;
    const { fullId, model, reason } = entry as { fullId?: unknown; model?: unknown; reason?: unknown };
    const id = fullId ?? model;
    if (typeof id !== "string" || !id) continue;
    unsupported.set(id, { reason: typeof reason === "string" ? reason : defaultReason });
  }
  return unsupported;
}
298
+
299
/**
 * Looks up a registered model by `provider/id` or by bare model id.
 *
 * An exact `provider/id` match always wins, wherever it sits in the registry;
 * only when none exists is the first model whose bare id equals the input
 * returned. This matters for ids that themselves contain a slash: a model
 * with id `openai/gpt-5` under another provider must not shadow the model
 * `gpt-5` of provider `openai`.
 *
 * @param ctx Extension context providing `modelRegistry.getAll()`.
 * @param id Identifier to resolve; surrounding whitespace is ignored.
 * @returns The matching model, or `undefined` for an empty id or no match.
 */
function findModelById(ctx: ExtensionContext, id: string | undefined): Model<Api> | undefined {
  const needle = id?.trim();
  if (!needle) return undefined;
  let bareIdMatch: Model<Api> | undefined;
  for (const model of ctx.modelRegistry.getAll()) {
    if (`${model.provider}/${model.id}` === needle) return model;
    if (bareIdMatch === undefined && model.id === needle) bareIdMatch = model;
  }
  return bareIdMatch;
}
308
+
309
/**
 * Reports whether a model's listed prices are meaningful: always true for
 * local models, otherwise true when at least one of the input, output,
 * cache-read or cache-write prices is greater than zero.
 */
function hasKnownPricing(model: Model<Api>): boolean {
  if (isLocalModel(model)) {
    return true;
  }
  const { input, output, cacheRead, cacheWrite } = model.cost;
  return [input, output, cacheRead, cacheWrite].some((rate) => rate > 0);
}
312
+
313
/**
 * Builds the pricing record for a model, optionally relative to a baseline.
 *
 * Absolute prices are copied from `model.cost`. Each `relative*` ratio is set
 * only when the model has known pricing, the baseline has known pricing, and
 * the baseline's corresponding price is greater than zero; otherwise it is
 * `undefined`. The blended ratio compares the sums of input and output prices.
 *
 * @param model Model being priced.
 * @param baseline Model to compare against, if any.
 */
function pricingForModel(model: Model<Api>, baseline: Model<Api> | undefined): ModelPricing {
  const known = hasKnownPricing(model);
  // A baseline only counts when its own pricing is known.
  const pricedBaseline = baseline && hasKnownPricing(baseline) ? baseline : undefined;
  const reference = pricedBaseline?.cost;
  const own = model.cost;

  const ratio = (numerator: number, denominator: number | undefined): number | undefined => {
    if (!known || !reference || denominator === undefined) return undefined;
    return denominator > 0 ? numerator / denominator : undefined;
  };

  const ownBlend = own.input + own.output;
  const referenceBlend = reference ? reference.input + reference.output : 0;

  return {
    inputPerMillion: own.input,
    outputPerMillion: own.output,
    cacheReadPerMillion: own.cacheRead,
    cacheWritePerMillion: own.cacheWrite,
    known,
    relativeTo: pricedBaseline ? `${pricedBaseline.provider}/${pricedBaseline.id}` : undefined,
    relativeInput: ratio(own.input, reference?.input),
    relativeOutput: ratio(own.output, reference?.output),
    relativeCacheRead: ratio(own.cacheRead, reference?.cacheRead),
    relativeBlended: ratio(ownBlend, referenceBlend),
  };
}
332
+
333
/**
 * Collects catalog rows for the models in the extension's registry.
 *
 * Models are filtered by `query`, sorted by provider and then by id, and
 * annotated with availability, cycling preference (from `settings.json`),
 * local support (from `model-catalog.json`), capabilities, thinking levels,
 * cost/quota labels, pricing and usage guidance.
 *
 * @param ctx Extension context supplying the model registry and current model.
 * @param includeUnavailable When true, start from all registered models rather than only the available ones.
 * @param unsupportedMode `"exclude"` drops unsupported rows, `"include"` keeps all rows, `"only"` keeps just the unsupported rows.
 * @param query Optional free-text filter.
 * @param relativeTo Optional baseline model id for relative pricing; when omitted or blank the current model is the baseline.
 * @returns The selected rows, all matching unsupported rows, the baseline id
 *   actually used (only when it has known pricing), and the requested baseline
 *   id when it could not be used.
 */
export function toRows(ctx: ExtensionContext, includeUnavailable: boolean, unsupportedMode: UnsupportedMode, query?: string, relativeTo?: string): ModelCatalogResult {
  const registry = ctx.modelRegistry;
  const availableIds = new Set(registry.getAvailable().map((model) => `${model.provider}/${model.id}`));
  const enabledIds = new Set(readSettings().enabledModels ?? []);
  const unsupportedById = unsupportedModels();
  const candidates = includeUnavailable ? registry.getAll() : registry.getAvailable();

  // Resolve the pricing baseline: an explicit request wins over the current model.
  const requestedBaselineId = relativeTo?.trim();
  const requestedBaseline = findModelById(ctx, requestedBaselineId);
  const baseline = requestedBaselineId ? requestedBaseline : ctx.model;
  let pricingBaseline: string | undefined;
  if (baseline && hasKnownPricing(baseline)) {
    pricingBaseline = `${baseline.provider}/${baseline.id}`;
  }
  const pricingBaselineMissing = requestedBaselineId && !pricingBaseline ? requestedBaselineId : undefined;

  // `filter` yields a fresh array, so sorting it does not touch the registry's list.
  const matching = candidates.filter((model) => matchesModel(model, query));
  matching.sort((left, right) => {
    const byProvider = String(left.provider).localeCompare(String(right.provider));
    return byProvider !== 0 ? byProvider : left.id.localeCompare(right.id);
  });

  const allRows: ModelCatalogRow[] = [];
  for (const model of matching) {
    const fullId = `${model.provider}/${model.id}`;
    const guidance = usageGuidance(model);
    const unsupported = unsupportedById.get(fullId);
    const thinkingLevels = getSupportedThinkingLevels(model);
    allRows.push({
      provider: String(model.provider),
      model: model.id,
      fullId,
      current: ctx.model ? ctx.model.provider === model.provider && ctx.model.id === model.id : false,
      available: availableIds.has(fullId),
      cycleEnabled: enabledIds.has(fullId),
      context: formatTokenCount(model.contextWindow),
      maxOut: formatTokenCount(model.maxTokens),
      thinking: model.reasoning ? "yes" : "no",
      thinkingLevels,
      thinkingLevelMap: model.thinkingLevelMap ? { ...model.thinkingLevelMap } : undefined,
      images: model.input.includes("image") ? "yes" : "no",
      cost: classifyCost(model),
      quota: classifyQuota(model),
      pricing: pricingForModel(model, baseline),
      supported: unsupported === undefined,
      unsupportedReason: unsupported?.reason,
      useFor: guidance.useFor,
      avoidFor: guidance.avoidFor,
    });
  }

  const excludedUnsupportedRows = allRows.filter((row) => !row.supported);
  let rows: ModelCatalogRow[];
  if (unsupportedMode === "only") {
    rows = excludedUnsupportedRows;
  } else if (unsupportedMode === "include") {
    rows = allRows;
  } else {
    rows = allRows.filter((row) => row.supported);
  }
  return { rows, excludedUnsupportedRows, pricingBaseline, pricingBaselineMissing };
}
384
+
385
/**
 * Renders a catalog result as a plain-text, space-padded table with footer notes.
 *
 * Layout: a header line, one line per row (the current model's id is prefixed
 * with `*`), a pricing note when applicable, an optional per-model
 * "Usage guidance" section, a note about excluded unsupported models, and a
 * closing legend. When there are no rows, a single explanatory sentence is
 * returned instead.
 *
 * @param result Rows and baseline information produced by `toRows`.
 * @param includeDetails Adds the per-model usage guidance section.
 * @param unsupportedMode The mode the rows were selected with; only `"exclude"` triggers the excluded-count note.
 * @param includePricing Replaces the single `rel-cost` column with numeric price and ratio columns.
 */
export function table(result: ModelCatalogResult, includeDetails: boolean, unsupportedMode: UnsupportedMode, includePricing: boolean): string {
  const { rows, excludedUnsupportedRows, pricingBaseline, pricingBaselineMissing } = result;
  if (rows.length === 0) {
    if (excludedUnsupportedRows.length > 0) {
      return "No matching supported models. Call with unsupported: 'include' to show locally unsupported matches.";
    }
    return "No matching models.";
  }

  const yesNo = (flag: boolean): string => (flag ? "yes" : "no");
  const price = (value: number, known: boolean): string => formatPricePerMillion(value, known);

  // Columns shared by both layouts; the tail differs with includePricing.
  const sharedHeaders = ["model", "auth", "support", "enabled", "ctx", "out", "caps", "think-levels", "price-tier"];
  const headers = includePricing
    ? [...sharedHeaders, "quota", "in$/M", "out$/M", "rel-in", "rel-out", "rel-blend"]
    : [...sharedHeaders, "rel-cost", "quota"];

  const body = rows.map((row) => {
    const { pricing } = row;
    const shared = [
      `${row.current ? "*" : ""}${row.fullId}`,
      yesNo(row.available),
      yesNo(row.supported),
      yesNo(row.cycleEnabled),
      row.context,
      row.maxOut,
      formatCapabilities(row),
      formatThinkingLevels(row.thinkingLevels),
      row.cost,
    ];
    if (includePricing) {
      return [
        ...shared,
        row.quota,
        price(pricing.inputPerMillion, pricing.known),
        price(pricing.outputPerMillion, pricing.known),
        formatRatio(pricing.relativeInput),
        formatRatio(pricing.relativeOutput),
        formatRatio(pricing.relativeBlended),
      ];
    }
    return [...shared, formatRatio(pricing.relativeBlended), row.quota];
  });

  // Each column is as wide as its widest cell, header included.
  const widths = headers.map((header, column) =>
    body.reduce((widest, cells) => Math.max(widest, cells[column].length), header.length),
  );
  const renderLine = (cells: string[]): string =>
    cells.map((cell, column) => cell.padEnd(widths[column])).join(" ");
  const lines = [renderLine(headers)];
  for (const cells of body) {
    lines.push(renderLine(cells));
  }

  if (pricingBaseline) {
    const note = includePricing
      ? `Pricing: $/M; rel-* ratios compare against ${pricingBaseline}.`
      : `rel-cost: rough local-registry cost vs ${pricingBaseline}; pass relativeTo to choose a different baseline.`;
    lines.push("", note);
  } else if (pricingBaselineMissing) {
    lines.push("", `Pricing: baseline '${pricingBaselineMissing}' was not found or lacks numeric pricing.`);
  } else if (includePricing) {
    lines.push("", "Pricing: $/M. Pass relativeTo: 'provider/model-id' to include ratios.");
  }

  if (includeDetails) {
    lines.push("", "Usage guidance:");
    for (const row of rows) {
      const { pricing } = row;
      const supportNote = row.supported ? "" : ` Unsupported locally: ${row.unsupportedReason}.`;
      let pricingNote = "";
      if (includePricing) {
        const relativeNote = pricing.relativeTo
          ? `, relative to ${pricing.relativeTo}: input ${formatRatio(pricing.relativeInput)}, output ${formatRatio(pricing.relativeOutput)}, blended ${formatRatio(pricing.relativeBlended)}`
          : "";
        pricingNote = ` Pricing: input ${price(pricing.inputPerMillion, pricing.known)}/M, output ${price(pricing.outputPerMillion, pricing.known)}/M${relativeNote}.`;
      }
      const levels = row.thinkingLevels.join(", ") || "none";
      lines.push(`- ${row.fullId}: thinking levels ${levels}; use for ${row.useFor}; avoid for ${row.avoidFor}.${pricingNote}${supportNote}`);
    }
  }

  if (unsupportedMode === "exclude" && excludedUnsupportedRows.length > 0) {
    lines.push("", `Excluded ${excludedUnsupportedRows.length} unsupported model(s); pass unsupported: 'include' to show them.`);
  }
  lines.push("", "Legend: think-levels use Pi abbreviations; price/quota/support are local guidance, not live guarantees.");
  return lines.join("\n");
}
package/index.ts CHANGED
@@ -1,434 +1,7 @@
1
- import * as fs from "node:fs";
2
- import * as os from "node:os";
3
- import * as path from "node:path";
4
- import type { Api, Model } from "@mariozechner/pi-ai";
5
- import type { ExtensionAPI, ExtensionContext } from "@mariozechner/pi-coding-agent";
1
+ import type { ExtensionAPI, ExtensionContext } from "@earendil-works/pi-coding-agent";
6
2
  // @ts-ignore The Pi extension runtime provides typebox, but this package does not ship declarations in current Pi installs.
7
3
  import { Type } from "typebox";
8
-
9
- type UnsupportedMode = "exclude" | "include" | "only";
10
-
11
- interface ListPiModelsParams {
12
- query?: string;
13
- includeUnavailable?: boolean;
14
- includeDetails?: boolean;
15
- includePricing?: boolean;
16
- relativeTo?: string;
17
- unsupported?: UnsupportedMode;
18
- }
19
-
20
- interface ModelCatalogSettings {
21
- enabledModels?: string[];
22
- }
23
-
24
- interface ModelCatalogConfig {
25
- unsupportedModels?: Array<string | { model?: string; fullId?: string; reason?: string }>;
26
- }
27
-
28
- interface UnsupportedModelInfo {
29
- reason: string;
30
- }
31
-
32
- interface ModelPricing {
33
- inputPerMillion: number;
34
- outputPerMillion: number;
35
- cacheReadPerMillion: number;
36
- cacheWritePerMillion: number;
37
- known: boolean;
38
- relativeTo?: string;
39
- relativeInput?: number;
40
- relativeOutput?: number;
41
- relativeCacheRead?: number;
42
- relativeBlended?: number;
43
- }
44
-
45
- interface ModelCatalogRow {
46
- provider: string;
47
- model: string;
48
- fullId: string;
49
- current: boolean;
50
- available: boolean;
51
- cycleEnabled: boolean;
52
- context: string;
53
- maxOut: string;
54
- thinking: string;
55
- images: string;
56
- cost: string;
57
- quota: string;
58
- pricing: ModelPricing;
59
- supported: boolean;
60
- unsupportedReason?: string;
61
- useFor: string;
62
- avoidFor: string;
63
- }
64
-
65
- interface ModelCatalogResult {
66
- rows: ModelCatalogRow[];
67
- excludedUnsupportedRows: ModelCatalogRow[];
68
- pricingBaseline?: string;
69
- pricingBaselineMissing?: string;
70
- }
71
-
72
- function agentDir(): string {
73
- return process.env.PI_CODING_AGENT_DIR ?? process.env.PI_AGENT_DIR ?? path.join(os.homedir(), ".pi", "agent");
74
- }
75
-
76
- function readSettings(): ModelCatalogSettings {
77
- try {
78
- const settingsPath = path.join(agentDir(), "settings.json");
79
- const parsed = JSON.parse(fs.readFileSync(settingsPath, "utf-8")) as ModelCatalogSettings;
80
- return parsed && typeof parsed === "object" ? parsed : {};
81
- } catch {
82
- return {};
83
- }
84
- }
85
-
86
- function readModelCatalogConfig(): ModelCatalogConfig {
87
- try {
88
- const configPath = path.join(agentDir(), "model-catalog.json");
89
- const parsed = JSON.parse(fs.readFileSync(configPath, "utf-8")) as ModelCatalogConfig;
90
- return parsed && typeof parsed === "object" ? parsed : {};
91
- } catch {
92
- return {};
93
- }
94
- }
95
-
96
- function formatTokenCount(count: number): string {
97
- if (count >= 1_000_000) {
98
- const millions = count / 1_000_000;
99
- return millions % 1 === 0 ? `${millions}M` : `${millions.toFixed(1)}M`;
100
- }
101
- if (count >= 1_000) {
102
- const thousands = count / 1_000;
103
- return thousands % 1 === 0 ? `${thousands}K` : `${thousands.toFixed(1)}K`;
104
- }
105
- return count.toString();
106
- }
107
-
108
- function formatPricePerMillion(value: number, known: boolean): string {
109
- if (!known) return "—";
110
- if (value === 0) return "$0";
111
- return `$${value < 1 ? value.toFixed(3) : value.toFixed(2)}`;
112
- }
113
-
114
- function formatRatio(value: number | undefined): string {
115
- if (value === undefined || !Number.isFinite(value)) return "—";
116
- return `${value.toFixed(2)}×`;
117
- }
118
-
119
- function formatCapabilities(row: ModelCatalogRow): string {
120
- const caps: string[] = [];
121
- if (row.thinking === "yes") caps.push("think");
122
- if (row.images === "yes") caps.push("img");
123
- return caps.length > 0 ? caps.join("+") : "text";
124
- }
125
-
126
- function shellWords(input: string): string[] {
127
- const words: string[] = [];
128
- let current = "";
129
- let quote: '"' | "'" | undefined;
130
- let escaping = false;
131
- for (const char of input) {
132
- if (escaping) {
133
- current += char;
134
- escaping = false;
135
- continue;
136
- }
137
- if (char === "\\" && quote !== "'") {
138
- escaping = true;
139
- continue;
140
- }
141
- if ((char === '"' || char === "'") && (!quote || quote === char)) {
142
- quote = quote ? undefined : char;
143
- continue;
144
- }
145
- if (!quote && /\s/.test(char)) {
146
- if (current) words.push(current);
147
- current = "";
148
- continue;
149
- }
150
- current += char;
151
- }
152
- if (current) words.push(current);
153
- return words;
154
- }
155
-
156
- function parseModelsGuideArgs(args: string): Pick<ListPiModelsParams, "query" | "includeDetails" | "includePricing" | "relativeTo"> {
157
- const queryParts: string[] = [];
158
- let includeDetails = false;
159
- let includePricing = false;
160
- let relativeTo: string | undefined;
161
- const words = shellWords(args);
162
- for (let index = 0; index < words.length; index += 1) {
163
- const word = words[index];
164
- if (word === "--verbose" || word === "--details" || word === "-v") {
165
- includeDetails = true;
166
- continue;
167
- }
168
- if (word === "--pricing" || word === "--prices" || word === "-p") {
169
- includePricing = true;
170
- continue;
171
- }
172
- if (word === "--relative-to" || word === "--relative" || word === "--baseline") {
173
- relativeTo = words[index + 1];
174
- index += 1;
175
- continue;
176
- }
177
- const relativeMatch = word.match(/^--(?:relative-to|relative|baseline)=(.+)$/);
178
- if (relativeMatch) {
179
- relativeTo = relativeMatch[1];
180
- continue;
181
- }
182
- queryParts.push(word);
183
- }
184
- return {
185
- query: queryParts.join(" ") || undefined,
186
- includeDetails,
187
- includePricing,
188
- relativeTo,
189
- };
190
- }
191
-
192
- function matchesModel(model: Model<Api>, query: string | undefined): boolean {
193
- if (!query?.trim()) return true;
194
- const needle = query.trim().toLowerCase();
195
- return `${model.provider} ${model.id} ${model.name}`.toLowerCase().includes(needle);
196
- }
197
-
198
- function isSparkModel(model: Model<Api>): boolean {
199
- return /(?:^|[-_])spark(?:$|[-_])/.test(model.id.toLowerCase());
200
- }
201
-
202
- function isLocalModel(model: Model<Api>): boolean {
203
- const provider = String(model.provider).toLowerCase();
204
- return provider.startsWith("local-") || provider.includes("llamaswap");
205
- }
206
-
207
- function classifyCost(model: Model<Api>): string {
208
- if (isLocalModel(model)) return "free/local";
209
- if (isSparkModel(model)) return "premium-speed";
210
- const cost = model.cost;
211
- const output = cost?.output ?? 0;
212
- const input = cost?.input ?? 0;
213
- const blended = input + output;
214
- if (blended <= 0) return "unknown/sub";
215
- if (blended <= 1) return "low";
216
- if (blended <= 8) return "medium";
217
- if (blended <= 30) return "high";
218
- return "premium";
219
- }
220
-
221
- function classifyQuota(model: Model<Api>): string {
222
- const id = model.id.toLowerCase();
223
- const provider = String(model.provider).toLowerCase();
224
- if (isLocalModel(model)) return "local-serial";
225
- if (isSparkModel(model)) return "very-fast";
226
- if (/mini|flash|lite|haiku|small/.test(id)) return "fast/limited";
227
- if (/opus|pro|gpt-5\.5|o3|sonnet|grok-4/.test(id)) return "scarce";
228
- if (provider.includes("codex") || provider.includes("copilot")) return "subscription";
229
- return "standard";
230
- }
231
-
232
- function modelProfile(model: Model<Api>): "local" | "latency" | "fast" | "standard" | "strong" {
233
- const id = model.id.toLowerCase();
234
- if (isLocalModel(model)) return "local";
235
- if (isSparkModel(model)) return "latency";
236
- if (/mini|flash|lite|haiku|small/.test(id)) return "fast";
237
- if (/opus|pro|gpt-5\.5|gpt-5\.4(?!-mini)|o3|sonnet|grok-4/.test(id)) return "strong";
238
- return "standard";
239
- }
240
-
241
- function usageGuidance(model: Model<Api>): Pick<ModelCatalogRow, "useFor" | "avoidFor"> {
242
- const profile = modelProfile(model);
243
- if (profile === "local") {
244
- return {
245
- useFor: "local background work when latency is acceptable, concurrency is low, and the configured model's capability is sufficient",
246
- avoidFor: "interactive work, latency-sensitive tasks, tasks above the configured local model's capability, final review, or parallel/concurrent local-model tasks unless explicitly chosen",
247
- };
248
- }
249
- if (profile === "latency") {
250
- return {
251
- useFor: "latency-critical bounded tasks and quick scouts when very high speed is worth premium cost",
252
- avoidFor: "cheap routine delegation, bulk mechanical work, cost-sensitive tasks, risky architecture, final review",
253
- };
254
- }
255
- if (profile === "fast") {
256
- return {
257
- useFor: "routine edits, search, summaries, tests, bounded subagent tasks when low cost or lower scarcity matters",
258
- avoidFor: "risky architecture, subtle debugging, final review of high-impact changes",
259
- };
260
- }
261
- if (profile === "strong") {
262
- return {
263
- useFor: "hard reasoning, risky refactors, architecture, adversarial review",
264
- avoidFor: "mechanical searches or easy-to-verify chores when faster models suffice",
265
- };
266
- }
267
- return {
268
- useFor: "default implementation, debugging, review, moderate planning",
269
- avoidFor: "very mechanical chores if a faster model is available; highest-risk work if a stronger model is available",
270
- };
271
- }
272
-
273
- function unsupportedModels(): Map<string, UnsupportedModelInfo> {
274
- const unsupported = new Map<string, UnsupportedModelInfo>();
275
- for (const entry of readModelCatalogConfig().unsupportedModels ?? []) {
276
- if (typeof entry === "string") {
277
- unsupported.set(entry, { reason: "marked unsupported in model-catalog.json" });
278
- continue;
279
- }
280
- const fullId = entry.fullId ?? entry.model;
281
- if (!fullId) continue;
282
- unsupported.set(fullId, { reason: entry.reason ?? "marked unsupported in model-catalog.json" });
283
- }
284
- return unsupported;
285
- }
286
-
287
- function findModelById(ctx: ExtensionContext, id: string | undefined): Model<Api> | undefined {
288
- const needle = id?.trim();
289
- if (!needle) return undefined;
290
- for (const model of ctx.modelRegistry.getAll()) {
291
- const fullId = `${model.provider}/${model.id}`;
292
- if (fullId === needle || model.id === needle) return model;
293
- }
294
- return undefined;
295
- }
296
-
297
- function hasKnownPricing(model: Model<Api>): boolean {
298
- return isLocalModel(model) || model.cost.input > 0 || model.cost.output > 0 || model.cost.cacheRead > 0 || model.cost.cacheWrite > 0;
299
- }
300
-
301
- function pricingForModel(model: Model<Api>, baseline: Model<Api> | undefined): ModelPricing {
302
- const known = hasKnownPricing(model);
303
- const baselineKnown = baseline ? hasKnownPricing(baseline) : false;
304
- const baselineCost = baselineKnown ? baseline?.cost : undefined;
305
- const modelBlend = model.cost.input + model.cost.output;
306
- const baselineBlend = baselineCost ? baselineCost.input + baselineCost.output : 0;
307
- return {
308
- inputPerMillion: model.cost.input,
309
- outputPerMillion: model.cost.output,
310
- cacheReadPerMillion: model.cost.cacheRead,
311
- cacheWritePerMillion: model.cost.cacheWrite,
312
- known,
313
- relativeTo: baseline && baselineKnown ? `${baseline.provider}/${baseline.id}` : undefined,
314
- relativeInput: known && baselineCost && baselineCost.input > 0 ? model.cost.input / baselineCost.input : undefined,
315
- relativeOutput: known && baselineCost && baselineCost.output > 0 ? model.cost.output / baselineCost.output : undefined,
316
- relativeCacheRead: known && baselineCost && baselineCost.cacheRead > 0 ? model.cost.cacheRead / baselineCost.cacheRead : undefined,
317
- relativeBlended: known && baselineCost && baselineBlend > 0 ? modelBlend / baselineBlend : undefined,
318
- };
319
- }
320
-
321
- function toRows(ctx: ExtensionContext, includeUnavailable: boolean, unsupportedMode: UnsupportedMode, query?: string, relativeTo?: string): ModelCatalogResult {
322
- const availableIds = new Set(ctx.modelRegistry.getAvailable().map((model) => `${model.provider}/${model.id}`));
323
- const enabledIds = new Set(readSettings().enabledModels ?? []);
324
- const unsupportedById = unsupportedModels();
325
- const models = includeUnavailable ? ctx.modelRegistry.getAll() : ctx.modelRegistry.getAvailable();
326
- const requestedBaselineId = relativeTo?.trim();
327
- const requestedBaseline = findModelById(ctx, requestedBaselineId);
328
- const baseline = requestedBaselineId ? requestedBaseline : ctx.model;
329
- const pricingBaseline = baseline && hasKnownPricing(baseline) ? `${baseline.provider}/${baseline.id}` : undefined;
330
- const pricingBaselineMissing = requestedBaselineId && !pricingBaseline ? requestedBaselineId : undefined;
331
- const allRows = models
332
- .filter((model) => matchesModel(model, query))
333
- .sort((a, b) => {
334
- const providerCmp = String(a.provider).localeCompare(String(b.provider));
335
- return providerCmp || a.id.localeCompare(b.id);
336
- })
337
- .map((model) => {
338
- const fullId = `${model.provider}/${model.id}`;
339
- const guidance = usageGuidance(model);
340
- const unsupported = unsupportedById.get(fullId);
341
- return {
342
- provider: String(model.provider),
343
- model: model.id,
344
- fullId,
345
- current: ctx.model ? ctx.model.provider === model.provider && ctx.model.id === model.id : false,
346
- available: availableIds.has(fullId),
347
- cycleEnabled: enabledIds.has(fullId),
348
- context: formatTokenCount(model.contextWindow),
349
- maxOut: formatTokenCount(model.maxTokens),
350
- thinking: model.reasoning ? "yes" : "no",
351
- images: model.input.includes("image") ? "yes" : "no",
352
- cost: classifyCost(model),
353
- quota: classifyQuota(model),
354
- pricing: pricingForModel(model, baseline),
355
- supported: unsupported === undefined,
356
- unsupportedReason: unsupported?.reason,
357
- useFor: guidance.useFor,
358
- avoidFor: guidance.avoidFor,
359
- };
360
- });
361
- const excludedUnsupportedRows = allRows.filter((row) => !row.supported);
362
- const rows = unsupportedMode === "only"
363
- ? excludedUnsupportedRows
364
- : unsupportedMode === "include"
365
- ? allRows
366
- : allRows.filter((row) => row.supported);
367
- return { rows, excludedUnsupportedRows, pricingBaseline, pricingBaselineMissing };
368
- }
369
-
370
- function table(result: ModelCatalogResult, includeDetails: boolean, unsupportedMode: UnsupportedMode, includePricing: boolean): string {
371
- const rows = result.rows;
372
- if (rows.length === 0) return result.excludedUnsupportedRows.length > 0 ? "No matching supported models. Call with unsupported: 'include' to show locally unsupported matches." : "No matching models.";
373
- const headers = includePricing
374
- ? ["model", "auth", "support", "enabled", "ctx", "out", "caps", "price-tier", "quota", "in$/M", "out$/M", "rel-in", "rel-out", "rel-blend"]
375
- : ["model", "auth", "support", "enabled", "ctx", "out", "caps", "price-tier", "rel-cost", "quota"];
376
- const body = rows.map((row) => {
377
- const cells = [
378
- `${row.current ? "*" : ""}${row.fullId}`,
379
- row.available ? "yes" : "no",
380
- row.supported ? "yes" : "no",
381
- row.cycleEnabled ? "yes" : "no",
382
- row.context,
383
- row.maxOut,
384
- formatCapabilities(row),
385
- row.cost,
386
- ];
387
- if (!includePricing) {
388
- cells.push(formatRatio(row.pricing.relativeBlended));
389
- }
390
- cells.push(row.quota);
391
- if (includePricing) {
392
- cells.push(
393
- formatPricePerMillion(row.pricing.inputPerMillion, row.pricing.known),
394
- formatPricePerMillion(row.pricing.outputPerMillion, row.pricing.known),
395
- formatRatio(row.pricing.relativeInput),
396
- formatRatio(row.pricing.relativeOutput),
397
- formatRatio(row.pricing.relativeBlended),
398
- );
399
- }
400
- return cells;
401
- });
402
- const widths = headers.map((header, index) => Math.max(header.length, ...body.map((cells) => cells[index].length)));
403
- const lines = [headers.map((header, index) => header.padEnd(widths[index])).join(" ")];
404
- for (const cells of body) {
405
- lines.push(cells.map((cell, index) => cell.padEnd(widths[index])).join(" "));
406
- }
407
- if (result.pricingBaseline) {
408
- lines.push("", includePricing
409
- ? `Pricing: $/million tokens. Relative columns compare against ${result.pricingBaseline}; rel-blend uses input+output rates as a rough 1:1 token-mix weight.`
410
- : `rel-cost compares input+output rates against ${result.pricingBaseline}; pass relativeTo/--relative-to to choose a different baseline.`);
411
- } else if (result.pricingBaselineMissing) {
412
- lines.push("", `Pricing: relative baseline '${result.pricingBaselineMissing}' was not found or has no numeric pricing.`);
413
- } else if (includePricing) {
414
- lines.push("", "Pricing: $/million tokens. Pass relativeTo: 'provider/model-id' to include relative cost ratios.");
415
- }
416
- if (includeDetails) {
417
- lines.push("", "Usage guidance:");
418
- for (const row of rows) {
419
- const support = row.supported ? "" : ` Unsupported locally: ${row.unsupportedReason}.`;
420
- const pricing = includePricing
421
- ? ` Pricing: input ${formatPricePerMillion(row.pricing.inputPerMillion, row.pricing.known)}/M, output ${formatPricePerMillion(row.pricing.outputPerMillion, row.pricing.known)}/M${row.pricing.relativeTo ? `, relative to ${row.pricing.relativeTo}: input ${formatRatio(row.pricing.relativeInput)}, output ${formatRatio(row.pricing.relativeOutput)}, blended ${formatRatio(row.pricing.relativeBlended)}` : ""}.`
422
- : "";
423
- lines.push(`- ${row.fullId}: use for ${row.useFor}; avoid for ${row.avoidFor}.${pricing}${support}`);
424
- }
425
- }
426
- if (unsupportedMode === "exclude" && result.excludedUnsupportedRows.length > 0) {
427
- lines.push("", `Excluded ${result.excludedUnsupportedRows.length} locally unsupported model(s). Call with unsupported: 'include' to show them.`);
428
- }
429
- lines.push("", "Notes: price-tier uses input+output $/million-token rates from Pi's local model registry: low ≤ $1, medium ≤ $8, high ≤ $30, premium > $30; local models are free/local and spark models are premium-speed. Local models are usually free from API billing but can be slow and effectively serial/concurrency-constrained: avoid using multiple local models or many same-local-model tasks at once unless your local backend supports it. Numeric prices may be nominal weights for subscription-backed providers. Zero/blank pricing outside free/local can mean unknown, bundled, or non-metered rather than free. Quota is guidance, not live remaining quota. Support is a local compatibility hint, not provider live availability.");
430
- return lines.join("\n");
431
- }
4
+ import { parseModelsGuideArgs, table, toRows, type ListPiModelsParams, type UnsupportedMode } from "./catalog.ts";
432
5
 
433
6
  const listPiModelsParameters = Type.Object({
434
7
  query: Type.Optional(Type.String({ description: "Optional substring filter, e.g. 'mini', 'codex', 'sonnet'." })),
@@ -447,21 +20,23 @@ export default function modelCatalog(pi: ExtensionAPI): void {
447
20
  pi.registerTool({
448
21
  name: "list_pi_models",
449
22
  label: "List Pi Models",
450
- description: "List available Pi models with concise decision fields by default, plus optional verbose guidance and numeric pricing.",
451
- promptSnippet: "List/query Pi models, model-selection guidance, and optional pricing.",
23
+ description: "List available Pi models with concise decision fields by default, plus supported thinking levels, optional verbose guidance, and numeric pricing.",
24
+ promptSnippet: "List/query Pi models, supported thinking levels, model-selection guidance, and optional pricing.",
452
25
  promptGuidelines: [
453
- "Use list_pi_models before choosing or recommending a model when current model availability, local support status, cost, quota, or capability matters.",
26
+ "Use list_pi_models before choosing or recommending a model when current model availability, local support status, cost, quota, thinking levels, or capability matters.",
454
27
  "For model overrides, choose rows with support yes and enabled yes unless the user explicitly authorizes configuration changes; auth yes alone only means credentials exist.",
455
28
  "list_pi_models excludes locally unsupported models by default; use unsupported: 'include' or 'only' only for diagnostics.",
456
- "list_pi_models price-tier/quota fields are guidance tiers, not live remaining quota.",
29
+ "Interpret list_pi_models fields as local guidance: support is local compatibility, quota is not live remaining quota, numeric pricing can be nominal/unknown, and rel-cost/rel-blend are rough local-registry ratios.",
30
+ "list_pi_models thinking levels are Pi names: off means provider no/none thinking when supported, and compact table abbreviations min/med/xhi mean minimal/medium/xhigh.",
31
+ "Treat local/free models as potentially slow or serial unless the local backend is known to support concurrent use; spark models are premium-speed, not cheap/mini substitutes.",
457
32
  "Default output is intentionally concise; request includeDetails: true only when use/avoid prose would materially help selection.",
458
- "When precise cost comparisons matter, pass includePricing: true and relativeTo: 'provider/model-id'. Treat numeric prices as local registry data, not guaranteed live billing for subscription-backed providers.",
33
+ "When precise cost comparisons matter, pass includePricing: true and relativeTo: 'provider/model-id'.",
459
34
  ],
460
35
  parameters: listPiModelsParameters,
461
36
  async execute(_toolCallId: string, params: ListPiModelsParams, _signal: AbortSignal | undefined, _onUpdate: unknown, ctx: ExtensionContext) {
462
37
  const includeUnavailable = params.includeUnavailable === true;
463
38
  const includeDetails = params.includeDetails === true;
464
- const unsupportedMode = params.unsupported ?? "exclude";
39
+ const unsupportedMode: UnsupportedMode = params.unsupported ?? "exclude";
465
40
  const includePricing = params.includePricing === true;
466
41
  const result = toRows(ctx, includeUnavailable, unsupportedMode, params.query, params.relativeTo);
467
42
  return {
@@ -475,7 +50,7 @@ export default function modelCatalog(pi: ExtensionAPI): void {
475
50
  });
476
51
 
477
52
  pi.registerCommand("models-guide", {
478
- description: "Show available Pi models with concise defaults. Use --verbose for details, or --pricing and --relative-to provider/model-id for numeric ratios.",
53
+ description: "Show available Pi models and supported thinking levels with concise defaults. Use --verbose for details, or --pricing and --relative-to provider/model-id for numeric ratios.",
479
54
  handler: async (args: string, ctx: ExtensionContext) => {
480
55
  const parsed = parseModelsGuideArgs(args);
481
56
  const result = toRows(ctx, false, "exclude", parsed.query, parsed.relativeTo);
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@badliveware/pi-model-catalog",
3
- "version": "0.1.1",
3
+ "version": "0.2.0",
4
4
  "description": "Expose Pi model listings and selection guidance as an agent tool.",
5
5
  "type": "module",
6
6
  "keywords": [
@@ -24,8 +24,10 @@
24
24
  },
25
25
  "files": [
26
26
  "README.md",
27
+ "CHANGELOG.md",
27
28
  "LICENSE",
28
29
  "index.ts",
30
+ "catalog.ts",
29
31
  "package.json"
30
32
  ],
31
33
  "pi": {
@@ -34,8 +36,8 @@
34
36
  ]
35
37
  },
36
38
  "peerDependencies": {
37
- "@mariozechner/pi-ai": "*",
38
- "@mariozechner/pi-coding-agent": "*",
39
+ "@earendil-works/pi-ai": "*",
40
+ "@earendil-works/pi-coding-agent": "*",
39
41
  "typebox": "*"
40
42
  },
41
43
  "engines": {