@visorcraft/idlehands 1.0.9 → 1.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -13,6 +13,7 @@ Idle Hands is built for people who want an agent that can actually ship work, no
13
13
 
14
14
  - **TUI-first UX** for real daily use (streaming output, slash commands, approvals)
15
15
  - **Runtime orchestration** (hosts/backends/models) for local + remote model stacks
16
+ - **Size-aware runtime probes** so very large GGUF/RPC models get sane startup timeouts by default
16
17
  - **Safety + approvals** with explicit modes (`plan`, `reject`, `default`, `auto-edit`, `yolo`)
17
18
  - **Headless mode** for CI and scripts (`json`, `stream-json`, `--fail-on-error`, `--diff-only`)
18
19
  - **Bot frontends** (Telegram + Discord) with service management
@@ -158,6 +159,24 @@ If you use a dedicated `idlehands` account, install/manage the service while log
158
159
 
159
160
  ---
160
161
 
162
+
163
+ ## Runtime probe defaults (size-aware)
164
+
165
+ When a model does not explicitly set a probe timeout and probe interval, Idle Hands derives defaults from the estimated model size on the target host.
166
+
167
+ Default tiers used by `idlehands select`:
168
+
169
+ | Model size (GiB) | probe timeout | probe interval |
170
+ |---:|---:|---:|
171
+ | <= 10 | 120s | 1000ms |
172
+ | <= 40 | 300s | 1200ms |
173
+ | <= 80 | 900s | 2000ms |
174
+ | <= 140 | 3600s | 5000ms |
175
+ | > 140 | 5400s | 5000ms |
176
+
177
+ Per-model overrides remain available in `runtimes.json` under `models.launch`.
178
+ Explicit per-model values always take precedence.
179
+
161
180
  ## Documentation map
162
181
 
163
182
  - [Getting Started](https://visorcraft.github.io/IdleHands/guide/getting-started)
package/dist/agent.js CHANGED
@@ -592,6 +592,14 @@ export function parseToolCallsFromContent(content) {
592
592
  const xmlCalls = parseXmlToolCalls(trimmed);
593
593
  if (xmlCalls?.length)
594
594
  return xmlCalls;
595
+ // Case 5: Lightweight function-tag calls (seen in some Qwen content-mode outputs):
596
+ // <function=tool_name>
597
+ // {...json args...}
598
+ // </function>
599
+ // or single-line <function=tool_name>{...}</function>
600
+ const fnTagCalls = parseFunctionTagToolCalls(trimmed);
601
+ if (fnTagCalls?.length)
602
+ return fnTagCalls;
595
603
  return null;
596
604
  }
597
605
  /**
@@ -1006,8 +1014,51 @@ export async function createSession(opts) {
1006
1014
  sessionMeta += `\n\n[Sub-agents] spawn_task is available (isolated context, sequential queue, default max_iterations=${subMaxIter}).`;
1007
1015
  }
1008
1016
  // Harness-driven suffix: append to first user message (NOT system prompt — §9b KV cache rule)
1017
+ // Check if model needs content-mode tool calls (known incompatible templates)
1018
+ // This runs before harness checks so it works regardless of quirk flags.
1019
+ {
1020
+ const modelName = cfg.model ?? '';
1021
+ const { OpenAIClient: OAIClient } = await import('./client.js');
1022
+ if (!client.contentModeToolCalls && OAIClient.needsContentMode(modelName)) {
1023
+ client.contentModeToolCalls = true;
1024
+ client.recordKnownPatternMatch();
1025
+ if (cfg.verbose) {
1026
+ console.warn(`[info] Model "${modelName}" matched known content-mode pattern — using content-based tool calls`);
1027
+ }
1028
+ }
1029
+ }
1009
1030
  if (harness.quirks.needsExplicitToolCallFormatReminder) {
1010
- sessionMeta += '\n\nIMPORTANT: Use the tool_calls mechanism to invoke tools. Do NOT write JSON tool invocations in your message text.';
1031
+ if (client.contentModeToolCalls) {
1032
+ // In content mode, tell the model to use JSON tool calls in its output
1033
+ sessionMeta += '\n\nYou have access to the following tools. To call a tool, output a JSON block in your response like this:\n```json\n{"name": "tool_name", "arguments": {"param": "value"}}\n```\nAvailable tools:\n';
1034
+ const toolSchemas = getToolsSchema();
1035
+ for (const t of toolSchemas) {
1036
+ const fn = t.function;
1037
+ if (fn) {
1038
+ const params = fn.parameters?.properties
1039
+ ? Object.entries(fn.parameters.properties).map(([k, v]) => `${k}: ${v.type ?? 'any'}`).join(', ')
1040
+ : '';
1041
+ sessionMeta += `- ${fn.name}(${params}): ${fn.description ?? ''}\n`;
1042
+ }
1043
+ }
1044
+ sessionMeta += '\nIMPORTANT: Output tool calls as JSON blocks in your message. Do NOT use the tool_calls API mechanism.\nIf you use XML/function tags (e.g. <function=name>), include a full JSON object of arguments between braces.';
1045
+ }
1046
+ else {
1047
+ sessionMeta += '\n\nIMPORTANT: Use the tool_calls mechanism to invoke tools. Do NOT write JSON tool invocations in your message text.';
1048
+ }
1049
+ // One-time tool-call template smoke test (first ask() call only, skip in content mode)
1050
+ if (!client.contentModeToolCalls && !client.__toolCallSmokeTested) {
1051
+ client.__toolCallSmokeTested = true;
1052
+ try {
1053
+ const smokeErr = await client.smokeTestToolCalls(cfg.model ?? 'default');
1054
+ if (smokeErr) {
1055
+ console.error(`\x1b[33m[warn] Tool-call smoke test failed: ${smokeErr}\x1b[0m`);
1056
+ console.error(`\x1b[33m This model/server may not support tool-call replay correctly.\x1b[0m`);
1057
+ console.error(`\x1b[33m Consider using a different model or updating llama.cpp.\x1b[0m`);
1058
+ }
1059
+ }
1060
+ catch { }
1061
+ }
1011
1062
  }
1012
1063
  if (harness.systemPromptSuffix) {
1013
1064
  sessionMeta += '\n\n' + harness.systemPromptSuffix;
@@ -2212,14 +2263,19 @@ export async function createSession(opts) {
2212
2263
  consecutiveCounts.set(sig, 1);
2213
2264
  }
2214
2265
  const consec = consecutiveCounts.get(sig) ?? 1;
2215
- if (consec >= 4) {
2266
+ if (consec >= 3) {
2216
2267
  const args = sig.slice(toolName.length + 1);
2217
2268
  const argsPreview = args.length > 220 ? args.slice(0, 220) + '…' : args;
2218
2269
  messages.push({
2219
2270
  role: 'user',
2220
- content: `[System] You have read the same resource ${consec} consecutive times (${toolName} ${argsPreview}). The content has not changed. Please proceed with your task using the information you already have.`,
2271
+ content: `[System] STOP READING: You have read the same resource ${consec} consecutive times (${toolName} ${argsPreview}). The content has NOT changed. You already have this data. Proceed immediately with your next action (write_file, edit_file, exec, etc.) — do NOT read this resource again.`,
2221
2272
  });
2222
2273
  }
2274
+ // Hard-break: after 6 consecutive identical reads, stop the session
2275
+ if (consec >= 6) {
2276
+ throw new Error(`tool ${toolName}: identical read repeated ${consec}x consecutively; breaking loop. ` +
2277
+ `The resource content has not changed between reads.`);
2278
+ }
2223
2279
  continue;
2224
2280
  }
2225
2281
  // Default behavior for mutating/other tools: break on repeated identical signature.
@@ -2821,4 +2877,30 @@ async function autoPickModel(client, cached) {
2821
2877
  clearTimeout(timer);
2822
2878
  }
2823
2879
  }
2880
+ function parseFunctionTagToolCalls(content) {
2881
+ const m = content.match(/<function=([\w.-]+)>([\s\S]*?)<\/function>/i);
2882
+ if (!m)
2883
+ return null;
2884
+ const name = m[1];
2885
+ const body = (m[2] ?? '').trim();
2886
+ // If body contains JSON object, use it as arguments; else empty object.
2887
+ let args = '{}';
2888
+ const jsonStart = body.indexOf('{');
2889
+ const jsonEnd = body.lastIndexOf('}');
2890
+ if (jsonStart !== -1 && jsonEnd > jsonStart) {
2891
+ const sub = body.slice(jsonStart, jsonEnd + 1);
2892
+ try {
2893
+ JSON.parse(sub);
2894
+ args = sub;
2895
+ }
2896
+ catch {
2897
+ // keep {}
2898
+ }
2899
+ }
2900
+ return [{
2901
+ id: 'call_0',
2902
+ type: 'function',
2903
+ function: { name, arguments: args }
2904
+ }];
2905
+ }
2824
2906
  //# sourceMappingURL=agent.js.map