npm - pi-ui-extend - Versions diffs - 0.1.24 → 0.1.26 - Mend

pi-ui-extend 0.1.24 → 0.1.26

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17)

package/dist/app/input/autocomplete-controller.js CHANGED Viewed

@@ -177,7 +177,6 @@ export async function completeInputWithPi(runtime, draft, config, signal) {
             maxTokens: requestModel.maxTokens,
             ...(parsedModel.thinkingLevel && parsedModel.thinkingLevel !== "off" ? { reasoning: parsedModel.thinkingLevel } : {}),
             signal: requestSignal.signal,
-            temperature: 0.1,
             timeoutMs,
         });
         for await (const event of stream) {

package/dist/app/session/session-event-controller.js CHANGED Viewed

@@ -363,6 +363,9 @@ export class AppSessionEventController {
         }
         if (!this.assistantTextBuffer)
             return visibleText;
+        if (!final && shouldHoldAssistantStreamWhitespaceTail(this.assistantTextBuffer, this.hasVisibleAssistantText(visibleText))) {
+            return visibleText;
+        }
         if (shouldHoldAssistantStreamTail(this.assistantTextBuffer, this.hasVisibleAssistantText(visibleText))) {
             if (final)
                 this.assistantTextBuffer = "";
@@ -445,6 +448,9 @@ function shouldHoldAssistantStreamTail(text, hasVisibleText) {
         return !hasVisibleText;
     return isPotentialDcpMetadataLine(text);
 }
+function shouldHoldAssistantStreamWhitespaceTail(text, hasVisibleText) {
+    return hasVisibleText && text.trim().length === 0;
+}
 function isHiddenMarkdownMetadataLine(line) {
     return isMarkdownReferenceDefinition(line) || isPotentialDcpMetadataLine(line);
 }

package/dist/app/session/tabs-controller.d.ts CHANGED Viewed

@@ -41,8 +41,10 @@ export declare class AppTabsController {
     private readonly runtimeLoadsByTabId;
     private readonly runtimeSubscriptionsByTabId;
     private readonly runtimeRefreshTimersByTabId;
+    private readonly historyReloadTimersByTabId;
     private readonly inputStatesByTabId;
     private readonly deferredUserMessagesByTabId;
+    private readonly tabIdsNeedingHistoryReload;
     private activeTabId;
     private pendingActiveTabId;
     private historyLoadGeneration;
@@ -89,6 +91,9 @@ export declare class AppTabsController {
     private shouldScheduleDelayedSyncForRuntimeEvent;
     private scheduleDelayedRuntimeSync;
     private clearRuntimeRefreshTimers;
+    private clearHistoryReloadTimers;
+    private scheduleDelayedHistoryReload;
+    private reloadActiveTabHistoryIfNeeded;
     private syncTabFromObservedRuntime;
     private storeActiveInputState;
     private storeActiveDeferredUserMessages;

package/dist/app/session/tabs-controller.js CHANGED Viewed

@@ -20,8 +20,10 @@ export class AppTabsController {
     runtimeLoadsByTabId = new Map();
     runtimeSubscriptionsByTabId = new Map();
     runtimeRefreshTimersByTabId = new Map();
+    historyReloadTimersByTabId = new Map();
     inputStatesByTabId = new Map();
     deferredUserMessagesByTabId = new Map();
+    tabIdsNeedingHistoryReload = new Set();
     activeTabId;
     pendingActiveTabId;
     historyLoadGeneration = 0;
@@ -632,6 +634,7 @@ export class AppTabsController {
         void this.saveTabs();
         this.scheduleTabPrewarm();
         await this.loadActiveSessionHistory(targetRuntime);
+        this.scheduleDelayedHistoryReload(target.id, targetRuntime);
     }
     async closeTab(tabId) {
         if (this.pendingActiveTabId) {
@@ -814,6 +817,8 @@ export class AppTabsController {
         this.runtimesByTabId.delete(tabId);
         this.runtimeLoadsByTabId.delete(tabId);
         this.clearRuntimeRefreshTimers(tabId);
+        this.clearHistoryReloadTimers(tabId);
+        this.tabIdsNeedingHistoryReload.delete(tabId);
         const subscription = this.runtimeSubscriptionsByTabId.get(tabId);
         subscription?.unsubscribe();
         this.runtimeSubscriptionsByTabId.delete(tabId);
@@ -822,6 +827,9 @@ export class AppTabsController {
         for (const tabId of this.runtimeRefreshTimersByTabId.keys()) {
             this.clearRuntimeRefreshTimers(tabId);
         }
+        for (const tabId of this.historyReloadTimersByTabId.keys()) {
+            this.clearHistoryReloadTimers(tabId);
+        }
         for (const subscription of this.runtimeSubscriptionsByTabId.values()) {
             subscription.unsubscribe();
         }
@@ -835,6 +843,7 @@ export class AppTabsController {
         const unsubscribe = runtime.session.subscribe((event) => {
             if (this.shouldScheduleDelayedSyncForRuntimeEvent(event)) {
                 this.scheduleDelayedRuntimeSync(tabId, runtime);
+                this.tabIdsNeedingHistoryReload.add(tabId);
             }
             if (!this.shouldSyncTabFromRuntimeEvent(event))
                 return;
@@ -878,6 +887,44 @@ export class AppTabsController {
             clearTimeout(timer);
         this.runtimeRefreshTimersByTabId.delete(tabId);
     }
+    clearHistoryReloadTimers(tabId) {
+        const timers = this.historyReloadTimersByTabId.get(tabId);
+        if (!timers)
+            return;
+        for (const timer of timers)
+            clearTimeout(timer);
+        this.historyReloadTimersByTabId.delete(tabId);
+    }
+    scheduleDelayedHistoryReload(tabId, runtime) {
+        if (!this.tabIdsNeedingHistoryReload.has(tabId))
+            return;
+        if (tabId !== this.activeTabId || this.pendingActiveTabId !== undefined)
+            return;
+        this.clearHistoryReloadTimers(tabId);
+        for (const delayMs of [150, 1000, 3000]) {
+            const timer = setTimeout(() => {
+                this.historyReloadTimersByTabId.get(tabId)?.delete(timer);
+                void this.reloadActiveTabHistoryIfNeeded(tabId, runtime, delayMs === 3000);
+            }, delayMs);
+            timer.unref?.();
+            let timers = this.historyReloadTimersByTabId.get(tabId);
+            if (!timers) {
+                timers = new Set();
+                this.historyReloadTimersByTabId.set(tabId, timers);
+            }
+            timers.add(timer);
+        }
+    }
+    async reloadActiveTabHistoryIfNeeded(tabId, runtime, finalAttempt) {
+        if (tabId !== this.activeTabId || this.pendingActiveTabId !== undefined || this.host.runtime() !== runtime)
+            return;
+        if (!this.tabIdsNeedingHistoryReload.has(tabId))
+            return;
+        await this.loadActiveSessionHistory(runtime);
+        if (finalAttempt && tabId === this.activeTabId && this.host.runtime() === runtime) {
+            this.tabIdsNeedingHistoryReload.delete(tabId);
+        }
+    }
     syncTabFromObservedRuntime(tabId, runtime) {
         const tab = this.tabItems.find((item) => item.id === tabId);
         if (!tab) {

package/dist/schemas/pi-tools-suite-schema.d.ts CHANGED Viewed

@@ -83,7 +83,6 @@ export declare const PiToolsSuiteConfigSchema: Type.TObject<{
             maxTaskChars: Type.TOptional<Type.TNumber>;
             maxTokens: Type.TOptional<Type.TNumber>;
             maxRetries: Type.TOptional<Type.TNumber>;
-            temperature: Type.TOptional<Type.TNumber>;
             timeoutMs: Type.TOptional<Type.TNumber>;
             debug: Type.TOptional<Type.TBoolean>;
         }>>;

package/dist/schemas/pi-tools-suite-schema.js CHANGED Viewed

@@ -115,7 +115,6 @@ const SubagentRoutingConfig = Type.Object({
     maxTaskChars: Type.Optional(Type.Number({ description: "Max task/scope characters sent to router.", minimum: 100 })),
     maxTokens: Type.Optional(Type.Number({ description: "Max router response tokens.", minimum: 8 })),
     maxRetries: Type.Optional(Type.Number({ description: "Router request retries.", minimum: 0 })),
-    temperature: Type.Optional(Type.Number({ description: "Router sampling temperature.", minimum: 0, maximum: 2 })),
     timeoutMs: Type.Optional(Type.Number({ description: "Router request timeout in ms.", minimum: 1000 })),
     debug: Type.Optional(Type.Boolean({ description: "Show routing debug warnings." })),
 }, { description: "LLM-based role routing configuration." });

package/extensions/session-title/config.ts CHANGED Viewed

@@ -12,7 +12,6 @@ export interface SessionTitleConfig {
 	maxRetries: number;
 	generationAttempts: number;
 	retryDelayMs: number;
-	temperature: number;
 	timeoutMs: number;
 	terminalTitle: boolean;
 	terminalTitlePrefix: string;
@@ -29,7 +28,6 @@ const DEFAULT_CONFIG: SessionTitleConfig = {
 	maxRetries: 2,
 	generationAttempts: 3,
 	retryDelayMs: 3000,
-	temperature: 0.2,
 	timeoutMs: 12_000,
 	terminalTitle: true,
 	terminalTitlePrefix: "pi — ",
@@ -83,9 +81,6 @@ function mergeConfig(base: SessionTitleConfig, raw: Record<string, unknown>): Se
 	if (typeof raw.retryDelayMs === "number" && Number.isFinite(raw.retryDelayMs)) {
 		next.retryDelayMs = Math.max(250, Math.floor(raw.retryDelayMs));
 	}
-	if (typeof raw.temperature === "number" && Number.isFinite(raw.temperature)) {
-		next.temperature = Math.min(2, Math.max(0, raw.temperature));
-	}
 	if (typeof raw.timeoutMs === "number" && Number.isFinite(raw.timeoutMs)) {
 		next.timeoutMs = Math.max(1000, Math.floor(raw.timeoutMs));
 	}

package/extensions/session-title/index.ts CHANGED Viewed

@@ -221,7 +221,6 @@ async function generateSessionTitle(
 			maxRetries: config.maxRetries,
 			maxTokens: config.maxTokens,
 			signal,
-			temperature: config.temperature,
 			timeoutMs: config.timeoutMs,
 		},
 	);

package/external/pi-tools-suite/README.md CHANGED Viewed

@@ -163,7 +163,7 @@ Async-subagents also injects a lightweight oh-my-openagent-style system-prompt s
 When the parent model cannot inspect images, async-subagents adds vision-delegation guidance and can save current-turn image attachments under `.pi/subagents/attachments/` so a `vision` sub-agent can receive them as `imagePaths`. Dynamic provider capabilities can be missing or stale after switching models, so blind parent models can still be configured explicitly with case-insensitive `*` masks under `asyncSubagents.vision.blindModelPatterns` in `~/.config/pi/pi-tools-suite.jsonc`. GLM is no longer treated as blind by async-subagents by default; the main-session `glm-coding-discipline` lookup tool is the preferred path for GLM visual lookups.
-When a task omits `subagentType`, async-subagents asks a lightweight router model to choose one configured type for each task from the task text/scope and the `types.<name>.description` metadata. Explicit task `subagentType` still wins. Keep type descriptions short, literal, and distinct because they are inserted into the router prompt for a small model. Router settings live under `asyncSubagents.routing` (`enabled`, `model`, `maxTaskChars`, `maxTokens`, `maxRetries`, `temperature`, `timeoutMs`, `debug`); the default router model is `zai/glm-4.5-air`. If the router is disabled, unavailable, aborted, or returns invalid JSON, omitted types fall back to `defaultType`.
+When a task omits `subagentType`, async-subagents asks a lightweight router model to choose one configured type for each task from the task text/scope and the `types.<name>.description` metadata. Explicit task `subagentType` still wins. Keep type descriptions short, literal, and distinct because they are inserted into the router prompt for a small model. Router settings live under `asyncSubagents.routing` (`enabled`, `model`, `maxTaskChars`, `maxTokens`, `maxRetries`, `timeoutMs`, `debug`); the default router model is `zai/glm-4.5-air`. If the router is disabled, unavailable, aborted, or returns invalid JSON, omitted types fall back to `defaultType`.
 Define optional `presets` under `asyncSubagents` in `~/.config/pi/pi-tools-suite.jsonc`, `$PI_CONFIG_DIR/pi-tools-suite.jsonc`, or project `.pi/pi-tools-suite.jsonc`, then use `/subagent-preset` or `/subagent-preset-config` to pick one persistent active preset for future spawns across all sessions. Set `AGENTS_PRESET=<name>` before launching Pi to override the saved preset for only the current process/session without changing the saved selection. If Pi is already running, use `/subagent-preset session <name>` for the same process-only override, and `/subagent-preset session-clear` to remove that runtime override. The TUI only selects presets already present in config; it does not edit JSON. If no `asyncSubagents` section exists, run `/subagent-preset init` to insert the bundled sample from `src/async-subagents/async-subagents.sample.jsonc` into the shared config (or to copy a standalone override file when `ASYNC_SUBAGENTS_CONFIG` / `PI_SUBAGENTS_CONFIG` is set). Existing config sections/files are never overwritten. Presets select an agent/model configuration: they can provide global fallback `model`/`thinking`/`extraArgs` and per-role overrides under `asyncSubagents.presets.<name>.types.<subagentType>`. They can also provide ordered `fallbackModels` globally or per-role; when a sub-agent fails with quota/rate-limit errors such as 429, async-subagents immediately tries the next fallback model and remembers the exhausted provider for the current Pi process/session, so later spawns skip that provider until Pi exits. This is intended for provider-level fallback chains such as `antigravity/* → openai-codex/* → zai/*` or `openai-codex/* → zai/*`; omit fallbacks for effectively unlimited providers. Antigravity account rotation has priority over preset fallback: async-subagents only falls back after Antigravity reports that all configured accounts are exhausted for that model. Explicit task model overrides and force-current-model disable preset fallback for that task. 
The active preset name is stored separately in `~/.pi/agent/subagent-preset-selection.json`.

package/external/pi-tools-suite/src/async-subagents/async-subagents.sample.jsonc CHANGED Viewed

@@ -58,7 +58,6 @@
     "maxTaskChars": 1200,
     "maxTokens": 512,
     "maxRetries": 1,
-    "temperature": 0,
     "timeoutMs": 12000,
     "debug": false
   },

package/external/pi-tools-suite/src/async-subagents/core/config.ts CHANGED Viewed

@@ -37,8 +37,6 @@ export interface SubagentRoutingConfig {
 	maxTokens?: number;
 	/** Router complete() retries. */
 	maxRetries?: number;
-	/** Router sampling temperature. */
-	temperature?: number;
 	/** Router request timeout. */
 	timeoutMs?: number;
 	/** Show best-effort UI warnings when routing falls back. */
@@ -150,7 +148,6 @@ export const DEFAULT_ROUTING_CONFIG: ResolvedSubagentRoutingConfig = {
 	maxTaskChars: 1200,
 	maxTokens: 512,
 	maxRetries: 1,
-	temperature: 0,
 	timeoutMs: 12_000,
 	debug: false,
 };
@@ -522,8 +519,6 @@ function normalizeRoutingConfig(value: Record<string, unknown>): SubagentRouting
 	if (maxTokens !== undefined) routing.maxTokens = Math.max(8, Math.round(maxTokens));
 	const maxRetries = finiteNumber(value.maxRetries);
 	if (maxRetries !== undefined) routing.maxRetries = Math.max(0, Math.round(maxRetries));
-	const temperature = finiteNumber(value.temperature);
-	if (temperature !== undefined) routing.temperature = Math.min(2, Math.max(0, temperature));
 	const timeoutMs = finiteNumber(value.timeoutMs);
 	if (timeoutMs !== undefined) routing.timeoutMs = Math.max(1000, Math.round(timeoutMs));
 	return routing;

package/external/pi-tools-suite/src/async-subagents/core/routing.ts CHANGED Viewed

@@ -80,7 +80,6 @@ export async function routeSubagentTasks(
 				maxRetries: routing.maxRetries,
 				maxTokens: routing.maxTokens,
 				signal,
-				temperature: routing.temperature,
 				timeoutMs: routing.timeoutMs,
 			},
 		);

package/external/pi-tools-suite/src/async-subagents/core/ultrawork-auto.ts CHANGED Viewed

@@ -82,7 +82,6 @@ export async function decideUltraworkAuto(
 				maxRetries: routing.maxRetries,
 				maxTokens: Math.min(routing.maxTokens, 32),
 				signal,
-				temperature: 0,
 				timeoutMs: routing.timeoutMs,
 			},
 		);

package/external/pi-tools-suite/src/default-pi-tools-suite-config.ts CHANGED Viewed

@@ -23,7 +23,7 @@ export const DEFAULT_PI_TOOLS_SUITE_CONFIG_JSONC = String.raw`{
   },
   "asyncSubagents": {
     "defaultType": "quick",
-    "routing": { "enabled": true, "model": "zai/glm-4.5-air", "maxTaskChars": 1200, "maxTokens": 512, "maxRetries": 1, "temperature": 0, "timeoutMs": 12000, "debug": false },
+    "routing": { "enabled": true, "model": "zai/glm-4.5-air", "maxTaskChars": 1200, "maxTokens": 512, "maxRetries": 1, "timeoutMs": 12000, "debug": false },
     "presets": {
       "cheap": {
         "description": "Use cheap GLM/Gemini Flash models for text/code roles; keep vision on the enabled GPT vision model.",

package/external/pi-tools-suite/src/glm-coding-discipline/index.ts CHANGED Viewed

@@ -40,6 +40,7 @@ const DEFAULT_LOOKUP_TIMEOUT_MS = 120_000;
 const MAX_IMAGE_BYTES = 16 * 1024 * 1024;
 const SILENCE_REMINDER_MIN_VIOLATION_GAP = 3;
 const SILENCE_REMINDER_MIN_MESSAGE_GAP = 12;
+const LOOKUP_TOOL_NAME = "lookup";
 const LOOKUP_TOOL_PARAMS = Type.Object(
 	{
@@ -187,16 +188,35 @@ export default function glmCodingDiscipline(pi: ExtensionAPI) {
 		pi.registerTool(createLookupTool());
 	}
+	function syncLookupToolAvailability(modelRef: string | undefined, cwd?: string): void {
+		const activeTools = typeof pi.getActiveTools === "function" ? pi.getActiveTools() : undefined;
+		if (!Array.isArray(activeTools)) return;
+		const lookupEnabled = Boolean(lookupModelFromConfig(cwd));
+		const shouldExposeLookup = lookupEnabled && isGlmModel(modelRef);
+		const hasLookup = activeTools.includes(LOOKUP_TOOL_NAME);
+		if (shouldExposeLookup === hasLookup) return;
+		if (typeof pi.setActiveTools !== "function") return;
+		const nextTools = shouldExposeLookup
+			? [...activeTools, LOOKUP_TOOL_NAME]
+			: activeTools.filter((tool: unknown) => tool !== LOOKUP_TOOL_NAME);
+		pi.setActiveTools([...new Set(nextTools)]);
+	}
 	maybeRegisterLookupTool(process.cwd());
 	pi.on("session_start", async (_event: unknown, ctx: unknown) => {
 		selectedModelRef = modelRefFromContext(ctx);
 		maybeRegisterLookupTool(contextCwd(ctx));
+		syncLookupToolAvailability(selectedModelRef, contextCwd(ctx));
 	});
 	pi.on("model_select", async (event: { model?: unknown }, ctx: unknown) => {
 		selectedModelRef = modelRefFromModel(event.model) ?? modelRefFromContext(ctx);
 		maybeRegisterLookupTool(contextCwd(ctx));
+		syncLookupToolAvailability(selectedModelRef, contextCwd(ctx));
 	});
 	pi.on("before_provider_request", async (event: { payload?: unknown }, ctx: unknown) => {
@@ -273,7 +293,7 @@ export function injectCodingDisciplineIntoPayload(payload: unknown, options: { l
 function createLookupTool() {
 	return {
-		name: "lookup",
+		name: LOOKUP_TOOL_NAME,
 		label: "Lookup",
 		description: [
 			"Ask the configured vision-capable lookup model to inspect recent image/screenshot context and answer a focused visual question.",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "pi-ui-extend",
-  "version": "0.1.24",
+  "version": "0.1.26",
   "private": false,
   "type": "module",
   "bin": {

package/schemas/pi-tools-suite.json CHANGED Viewed

@@ -419,12 +419,6 @@
               "description": "Router request retries.",
               "minimum": 0
             },
-            "temperature": {
-              "type": "number",
-              "description": "Router sampling temperature.",
-              "minimum": 0,
-              "maximum": 2
-            },
             "timeoutMs": {
               "type": "number",
               "description": "Router request timeout in ms.",