npm - @tyvm/knowhow - Versions diffs - 0.0.105 → 0.0.107 - Mend

@tyvm/knowhow 0.0.105 → 0.0.107

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (219) hide show

package/CONFIG.md +8 -5
package/package.json +3 -2
package/scripts/check-model-pricing.ts +509 -0
package/scripts/compare-openrouter-coverage.ts +576 -0
package/src/agents/base/base.ts +169 -5
package/src/agents/tools/execCommand.ts +4 -0
package/src/agents/tools/executeScript/definition.ts +1 -1
package/src/agents/tools/index.ts +0 -1
package/src/agents/tools/list.ts +3 -43
package/src/agents/tools/writeFile.ts +1 -1
package/src/auth/browserLogin.ts +9 -4
package/src/chat/modules/RemoteSyncModule.ts +3 -0
package/src/cli.ts +31 -1
package/src/clients/anthropic.ts +8 -2
package/src/clients/cerebras.ts +10 -0
package/src/clients/contextLimits.ts +7 -2
package/src/clients/copilot.ts +23 -0
package/src/clients/deepseek.ts +16 -0
package/src/clients/fireworks.ts +15 -0
package/src/clients/gemini.ts +59 -4
package/src/clients/github.ts +16 -0
package/src/clients/groq.ts +15 -0
package/src/clients/http.ts +194 -6
package/src/clients/index.ts +116 -4
package/src/clients/llama.ts +16 -0
package/src/clients/mistral.ts +16 -0
package/src/clients/nvidia.ts +16 -0
package/src/clients/openai.ts +53 -12
package/src/clients/openrouter.ts +17 -0
package/src/clients/pricing/anthropic.ts +105 -78
package/src/clients/pricing/cerebras.ts +11 -0
package/src/clients/pricing/copilot.ts +60 -0
package/src/clients/pricing/deepseek.ts +15 -0
package/src/clients/pricing/fireworks.ts +32 -0
package/src/clients/pricing/github.ts +69 -0
package/src/clients/pricing/google.ts +245 -206
package/src/clients/pricing/groq.ts +56 -0
package/src/clients/pricing/index.ts +42 -5
package/src/clients/pricing/llama.ts +18 -0
package/src/clients/pricing/mistral.ts +34 -0
package/src/clients/pricing/models.ts +7 -236
package/src/clients/pricing/nvidia.ts +102 -0
package/src/clients/pricing/openai.ts +348 -171
package/src/clients/pricing/openrouter.ts +36 -0
package/src/clients/pricing/types.ts +83 -2
package/src/clients/pricing/xai.ts +121 -65
package/src/clients/types.ts +28 -1
package/src/clients/xai.ts +161 -1
package/src/fileSync.ts +8 -2
package/src/login.ts +11 -3
package/src/services/AgentSyncFs.ts +36 -12
package/src/services/KnowhowClient.ts +11 -0
package/src/services/LazyToolsService.ts +6 -0
package/src/services/S3.ts +0 -7
package/src/services/modules/index.ts +11 -2
package/src/types.ts +56 -279
package/src/worker.ts +174 -0
package/tests/clients/AIClient.test.ts +1 -1
package/tests/clients/anthropic.test.ts +202 -0
package/tests/clients/pricing.test.ts +37 -0
package/tests/manual/clients/completions.json +838 -226
package/tests/manual/clients/completions.test.ts +46 -31
package/ts_build/package.json +3 -2
package/ts_build/src/agents/base/base.d.ts +18 -1
package/ts_build/src/agents/base/base.js +111 -4
package/ts_build/src/agents/base/base.js.map +1 -1
package/ts_build/src/agents/tools/execCommand.js +3 -0
package/ts_build/src/agents/tools/execCommand.js.map +1 -1
package/ts_build/src/agents/tools/executeScript/definition.js +1 -1
package/ts_build/src/agents/tools/executeScript/definition.js.map +1 -1
package/ts_build/src/agents/tools/index.d.ts +0 -1
package/ts_build/src/agents/tools/index.js +0 -1
package/ts_build/src/agents/tools/index.js.map +1 -1
package/ts_build/src/agents/tools/list.js +3 -38
package/ts_build/src/agents/tools/list.js.map +1 -1
package/ts_build/src/agents/tools/visionTool.d.ts +1 -1
package/ts_build/src/agents/tools/writeFile.js +1 -1
package/ts_build/src/agents/tools/writeFile.js.map +1 -1
package/ts_build/src/ai.d.ts +1 -1
package/ts_build/src/auth/browserLogin.d.ts +2 -1
package/ts_build/src/auth/browserLogin.js +10 -3
package/ts_build/src/auth/browserLogin.js.map +1 -1
package/ts_build/src/chat/modules/RemoteSyncModule.js +1 -0
package/ts_build/src/chat/modules/RemoteSyncModule.js.map +1 -1
package/ts_build/src/cli.js +19 -0
package/ts_build/src/cli.js.map +1 -1
package/ts_build/src/clients/anthropic.d.ts +1 -82
package/ts_build/src/clients/anthropic.js +8 -2
package/ts_build/src/clients/anthropic.js.map +1 -1
package/ts_build/src/clients/cerebras.d.ts +4 -0
package/ts_build/src/clients/cerebras.js +14 -0
package/ts_build/src/clients/cerebras.js.map +1 -0
package/ts_build/src/clients/contextLimits.js +7 -2
package/ts_build/src/clients/contextLimits.js.map +1 -1
package/ts_build/src/clients/copilot.d.ts +4 -0
package/ts_build/src/clients/copilot.js +15 -0
package/ts_build/src/clients/copilot.js.map +1 -0
package/ts_build/src/clients/deepseek.d.ts +4 -0
package/ts_build/src/clients/deepseek.js +15 -0
package/ts_build/src/clients/deepseek.js.map +1 -0
package/ts_build/src/clients/fireworks.d.ts +4 -0
package/ts_build/src/clients/fireworks.js +15 -0
package/ts_build/src/clients/fireworks.js.map +1 -0
package/ts_build/src/clients/gemini.d.ts +1 -0
package/ts_build/src/clients/gemini.js +38 -2
package/ts_build/src/clients/gemini.js.map +1 -1
package/ts_build/src/clients/github.d.ts +4 -0
package/ts_build/src/clients/github.js +15 -0
package/ts_build/src/clients/github.js.map +1 -0
package/ts_build/src/clients/groq.d.ts +4 -0
package/ts_build/src/clients/groq.js +15 -0
package/ts_build/src/clients/groq.js.map +1 -0
package/ts_build/src/clients/http.d.ts +22 -1
package/ts_build/src/clients/http.js +135 -7
package/ts_build/src/clients/http.js.map +1 -1
package/ts_build/src/clients/index.d.ts +14 -0
package/ts_build/src/clients/index.js +94 -4
package/ts_build/src/clients/index.js.map +1 -1
package/ts_build/src/clients/llama.d.ts +4 -0
package/ts_build/src/clients/llama.js +15 -0
package/ts_build/src/clients/llama.js.map +1 -0
package/ts_build/src/clients/mistral.d.ts +4 -0
package/ts_build/src/clients/mistral.js +15 -0
package/ts_build/src/clients/mistral.js.map +1 -0
package/ts_build/src/clients/nvidia.d.ts +4 -0
package/ts_build/src/clients/nvidia.js +15 -0
package/ts_build/src/clients/nvidia.js.map +1 -0
package/ts_build/src/clients/openai.d.ts +4 -206
package/ts_build/src/clients/openai.js +38 -10
package/ts_build/src/clients/openai.js.map +1 -1
package/ts_build/src/clients/openrouter.d.ts +4 -0
package/ts_build/src/clients/openrouter.js +15 -0
package/ts_build/src/clients/openrouter.js.map +1 -0
package/ts_build/src/clients/pricing/anthropic.d.ts +26 -78
package/ts_build/src/clients/pricing/anthropic.js +75 -78
package/ts_build/src/clients/pricing/anthropic.js.map +1 -1
package/ts_build/src/clients/pricing/cerebras.d.ts +4 -0
package/ts_build/src/clients/pricing/cerebras.js +11 -0
package/ts_build/src/clients/pricing/cerebras.js.map +1 -0
package/ts_build/src/clients/pricing/copilot.d.ts +5 -0
package/ts_build/src/clients/pricing/copilot.js +35 -0
package/ts_build/src/clients/pricing/copilot.js.map +1 -0
package/ts_build/src/clients/pricing/deepseek.d.ts +5 -0
package/ts_build/src/clients/pricing/deepseek.js +10 -0
package/ts_build/src/clients/pricing/deepseek.js.map +1 -0
package/ts_build/src/clients/pricing/fireworks.d.ts +5 -0
package/ts_build/src/clients/pricing/fireworks.js +21 -0
package/ts_build/src/clients/pricing/fireworks.js.map +1 -0
package/ts_build/src/clients/pricing/github.d.ts +4 -0
package/ts_build/src/clients/pricing/github.js +58 -0
package/ts_build/src/clients/pricing/github.js.map +1 -0
package/ts_build/src/clients/pricing/google.d.ts +59 -6
package/ts_build/src/clients/pricing/google.js +214 -167
package/ts_build/src/clients/pricing/google.js.map +1 -1
package/ts_build/src/clients/pricing/groq.d.ts +5 -0
package/ts_build/src/clients/pricing/groq.js +41 -0
package/ts_build/src/clients/pricing/groq.js.map +1 -0
package/ts_build/src/clients/pricing/index.d.ts +16 -5
package/ts_build/src/clients/pricing/index.js +62 -7
package/ts_build/src/clients/pricing/index.js.map +1 -1
package/ts_build/src/clients/pricing/llama.d.ts +4 -0
package/ts_build/src/clients/pricing/llama.js +14 -0
package/ts_build/src/clients/pricing/llama.js.map +1 -0
package/ts_build/src/clients/pricing/mistral.d.ts +5 -0
package/ts_build/src/clients/pricing/mistral.js +23 -0
package/ts_build/src/clients/pricing/mistral.js.map +1 -0
package/ts_build/src/clients/pricing/models.d.ts +5 -4
package/ts_build/src/clients/pricing/models.js +8 -162
package/ts_build/src/clients/pricing/models.js.map +1 -1
package/ts_build/src/clients/pricing/nvidia.d.ts +8 -0
package/ts_build/src/clients/pricing/nvidia.js +96 -0
package/ts_build/src/clients/pricing/nvidia.js.map +1 -0
package/ts_build/src/clients/pricing/openai.d.ts +86 -197
package/ts_build/src/clients/pricing/openai.js +295 -168
package/ts_build/src/clients/pricing/openai.js.map +1 -1
package/ts_build/src/clients/pricing/openrouter.d.ts +4 -0
package/ts_build/src/clients/pricing/openrouter.js +29 -0
package/ts_build/src/clients/pricing/openrouter.js.map +1 -0
package/ts_build/src/clients/pricing/types.d.ts +27 -2
package/ts_build/src/clients/pricing/types.js +46 -0
package/ts_build/src/clients/pricing/types.js.map +1 -1
package/ts_build/src/clients/pricing/xai.d.ts +37 -57
package/ts_build/src/clients/pricing/xai.js +92 -59
package/ts_build/src/clients/pricing/xai.js.map +1 -1
package/ts_build/src/clients/types.d.ts +12 -1
package/ts_build/src/clients/xai.d.ts +2 -62
package/ts_build/src/clients/xai.js +132 -1
package/ts_build/src/clients/xai.js.map +1 -1
package/ts_build/src/fileSync.js +7 -2
package/ts_build/src/fileSync.js.map +1 -1
package/ts_build/src/login.js +8 -2
package/ts_build/src/login.js.map +1 -1
package/ts_build/src/services/AgentSyncFs.js +1 -0
package/ts_build/src/services/AgentSyncFs.js.map +1 -1
package/ts_build/src/services/KnowhowClient.d.ts +1 -0
package/ts_build/src/services/KnowhowClient.js +7 -0
package/ts_build/src/services/KnowhowClient.js.map +1 -1
package/ts_build/src/services/LazyToolsService.d.ts +1 -0
package/ts_build/src/services/LazyToolsService.js +3 -0
package/ts_build/src/services/LazyToolsService.js.map +1 -1
package/ts_build/src/services/S3.js +0 -7
package/ts_build/src/services/S3.js.map +1 -1
package/ts_build/src/services/modules/index.js +41 -1
package/ts_build/src/services/modules/index.js.map +1 -1
package/ts_build/src/types.d.ts +163 -124
package/ts_build/src/types.js +33 -213
package/ts_build/src/types.js.map +1 -1
package/ts_build/src/worker.d.ts +4 -0
package/ts_build/src/worker.js +140 -0
package/ts_build/src/worker.js.map +1 -1
package/ts_build/tests/clients/AIClient.test.js +1 -1
package/ts_build/tests/clients/AIClient.test.js.map +1 -1
package/ts_build/tests/clients/anthropic.test.d.ts +1 -0
package/ts_build/tests/clients/anthropic.test.js +159 -0
package/ts_build/tests/clients/anthropic.test.js.map +1 -0
package/ts_build/tests/clients/pricing.test.js +21 -0
package/ts_build/tests/clients/pricing.test.js.map +1 -1
package/ts_build/tests/manual/clients/completions.test.js +27 -24
package/ts_build/tests/manual/clients/completions.test.js.map +1 -1

package/src/agents/base/base.ts CHANGED Viewed

@@ -1,5 +1,6 @@
 import { EventEmitter } from "events"; // kept for reference; agentEvents now uses EventService
 import {
+  CompletionResponse,
   GenericClient,
   Message,
   MessageContent,
@@ -59,6 +60,10 @@ export abstract class BaseAgent implements IAgent {
   protected turnCount = 0;
   protected totalCostUsd = 0;
   protected currentThread = 0;
+  protected totalInputTokens = 0;
+  protected totalOutputTokens = 0;
+  protected totalCacheReadTokens = 0;
+  protected totalCacheWriteTokens = 0;
   protected compressThreshold = 30000;
   protected compressMinMessages = 30;
@@ -95,6 +100,7 @@ export abstract class BaseAgent implements IAgent {
     agentSay: "agent:say",
     agentNewTask: "agent:newTask",
     agentTaskComplete: "agent:taskComplete",
+    tokenUsage: "agent:tokenUsage",
   };
   public tools: ToolsService;
@@ -194,6 +200,10 @@ export abstract class BaseAgent implements IAgent {
     this.taskBreakdown = "";
     this.summaries = [];
     this.totalCostUsd = 0;
+    this.totalInputTokens = 0;
+    this.totalOutputTokens = 0;
+    this.totalCacheReadTokens = 0;
+    this.totalCacheWriteTokens = 0;
     this.status = this.eventTypes.inProgress;
     this.turnCount = 0;
     this.startTimeMs = Date.now();
@@ -283,6 +293,33 @@ export abstract class BaseAgent implements IAgent {
     this.easyFinalAnswer = value;
   }
+  /**
+   * Decide whether a plain-text model reply should be treated as a termination signal
+   * (e.g. "Done", "Complete", "Finished", "finalAnswer").
+   * This handles the case where an agent refuses to call finalAnswer and just says a
+   * short termination word or opens its reply with a completion phrase.
+   *
+   * Three checks are applied in order:
+   *   1. The whole reply is at most 3 words and exactly matches a termination word/phrase
+   *      (optionally followed by "." / "!").
+   *   2. The first 1-3 words of the reply start with a completion phrase.
+   *   3. Only when `easyFinalAnswer` is enabled: the reply starts with "✅", a digit,
+   *      ".", "-" or "*".
+   *
+   * @param content The text content of the model's message.
+   * @returns true when any of the checks above matches, false otherwise.
+   */
+  protected isTerminationResponse(content: string): boolean {
+    const trimmed = content.trim();
+    // Tokenize once; both the word count and the leading-words check use the same split.
+    const words = trimmed.split(/\s+/).filter(Boolean);
+    // Short response (≤ 3 words) that matches a termination word/phrase exactly
+    if (words.length <= 3) {
+      const terminationPattern = /^(done|complete|completed|finished|final\s*answer|task\s*complete|all\s*done|that'?s\s*(all|it)|ok(ay)?|yes)[.!]*$/i;
+      if (terminationPattern.test(trimmed)) return true;
+    }
+    // Check if the first 1-3 words indicate task completion (for longer responses)
+    // e.g. "Task complete: ...", "All done.", "No further changes needed.", "Confirmed complete."
+    const firstWords = words.slice(0, 3).join(" ");
+    // `confirm(ed)?` accepts both "confirm" and "confirmed"; the previous `confirmed?`
+    // only made the trailing "d" optional and therefore never matched "confirm".
+    const firstWordPattern = /^(task\s*(complete|completed|done|finished)|all\s*done|no\s*(further|more|additional|changes|action)|confirm(ed)?\s*(complete|done|finished|one\s*last)|nothing\s*(more|further|else)|standing\s*by|everything\s*is|still\s*confirmed|acknowledged|done\s*and|complete\s*(and|\.)|completed\s*successfully|no\s*additional|verified\s*and)/i;
+    if (firstWordPattern.test(firstWords)) return true;
+    // If easyFinalAnswer mode is on, also match response starting with "✅" or numbered confirmation lists
+    if (this.easyFinalAnswer) {
+      if (trimmed.startsWith("✅") || /^[\d\.\-\*]/.test(trimmed)) return true;
+    }
+    return false;
+  }
   getEnabledTools() {
     return this.tools
       .getTools()
@@ -369,6 +406,44 @@ export abstract class BaseAgent implements IAgent {
     return this.totalCostUsd;
   }
+  /**
+   * Add one response's token usage to the running totals and emit a
+   * `tokenUsage` event carrying both the per-call counts and the new totals.
+   *
+   * Both OpenAI-style (prompt_tokens/completion_tokens) and Anthropic-style
+   * (input_tokens/output_tokens) field names are accepted; a missing field counts as 0.
+   * Does nothing when `usage` is falsy.
+   *
+   * @param usage The usage object reported with a completion response.
+   */
+  adjustTokenUsage(usage: any) {
+    if (!usage) {
+      return;
+    }
+    // Per-call counts; for each one the first non-nullish provider field wins.
+    const delta = {
+      inputTokens: usage.input_tokens ?? usage.prompt_tokens ?? 0,
+      outputTokens: usage.output_tokens ?? usage.completion_tokens ?? 0,
+      cacheReadTokens:
+        usage.cache_read_input_tokens ??
+        usage.cache_read_tokens ??
+        usage.prompt_tokens_details?.cached_tokens ??
+        0,
+      cacheWriteTokens:
+        usage.cache_creation_input_tokens ?? usage.cache_write_tokens ?? 0,
+    };
+    this.totalInputTokens += delta.inputTokens;
+    this.totalOutputTokens += delta.outputTokens;
+    this.totalCacheReadTokens += delta.cacheReadTokens;
+    this.totalCacheWriteTokens += delta.cacheWriteTokens;
+    // Payload: this call's counts first, then the updated running totals.
+    this.agentEvents.emit(this.eventTypes.tokenUsage, {
+      ...delta,
+      totalInputTokens: this.totalInputTokens,
+      totalOutputTokens: this.totalOutputTokens,
+      totalCacheReadTokens: this.totalCacheReadTokens,
+      totalCacheWriteTokens: this.totalCacheWriteTokens,
+    });
+  }
+  /**
+   * Snapshot of the running token totals kept by this agent.
+   *
+   * @returns The accumulated input, output, cache-read and cache-write token counts.
+   */
+  getTokenUsage() {
+    const {
+      totalInputTokens,
+      totalOutputTokens,
+      totalCacheReadTokens,
+      totalCacheWriteTokens,
+    } = this;
+    return {
+      totalInputTokens,
+      totalOutputTokens,
+      totalCacheReadTokens,
+      totalCacheWriteTokens,
+    };
+  }
   startNewThread(messages: Message[]) {
     this.currentThread++;
     this.agentEvents.emit(this.eventTypes.newThread, messages);
@@ -544,8 +619,14 @@ export abstract class BaseAgent implements IAgent {
   async kill() {
     this.log("Killing agent");
-    if (this.status === this.eventTypes.kill || this.status === this.eventTypes.done) {
-      this.log("Agent is already being killed or done, ignoring duplicate kill()", "warn");
+    if (
+      this.status === this.eventTypes.kill ||
+      this.status === this.eventTypes.done
+    ) {
+      this.log(
+        "Agent is already being killed or done, ignoring duplicate kill()",
+        "warn"
+      );
       return;
     }
     this.agentEvents.emit(this.eventTypes.kill, this);
@@ -651,15 +732,22 @@ export abstract class BaseAgent implements IAgent {
           "warn"
         );
         const error = response as any;
-        if ("response" in error && "data" in error.response) {
+        if (error != null && "response" in error && "data" in error.response) {
           this.log(
             `Response data: ${JSON.stringify(error.response.data, null, 2)}`,
             "warn"
           );
         }
+        if (!response?.choices) {
+          const errMsg =
+            (error?.error?.message ?? error?.message) ||
+            JSON.stringify(response);
+          throw new Error(`AI response error: ${errMsg}`);
+        }
       }
       this.adjustTotalCostUsd(response?.usd_cost);
+      this.adjustTokenUsage(response?.usage);
       this.log("agent response cost: " + response?.usd_cost);
       // Typically, there's only one choice in the array, but you could have many
@@ -687,6 +775,16 @@ export abstract class BaseAgent implements IAgent {
           this.updateCurrentThread(messages);
+          const truncationWarning = this.detectTruncatedToolCalls(
+            toolCalls,
+            response
+          );
+          if (truncationWarning) {
+            messages.push(truncationWarning as Message);
+            this.updateCurrentThread(messages);
+            return this.call(userInput, messages);
+          }
           for (const toolCall of toolCalls) {
             if (this.status === this.eventTypes.pause) {
               this.log(
@@ -755,6 +853,18 @@ export abstract class BaseAgent implements IAgent {
       // Early exit: not required to call tool
       const firstMessage = response.choices[0].message;
+      // Auto-detect termination words: if the model is just saying "Done", "Complete", etc.
+      if (
+        response.choices.length === 1 &&
+        firstMessage.content &&
+        this.isTerminationResponse(firstMessage.content)
+      ) {
+        this.log(`Termination word detected: "${firstMessage.content.trim()}", treating as finalAnswer`);
+        this.status = this.eventTypes.done;
+        this.agentEvents.emit(this.eventTypes.done, firstMessage.content);
+        return firstMessage.content;
+      }
       if (
         response.choices.length === 1 &&
         firstMessage.content &&
@@ -808,7 +918,7 @@ export abstract class BaseAgent implements IAgent {
         this.logStatus();
         const continuation = `<Workflow>
-        workflow continues until you call one of ${this.requiredToolNames}.\n
+        workflow continues until you call one of ${JSON.stringify(this.requiredToolNames)}.\n
         ${statusMessage}
         </Workflow>`;
@@ -854,7 +964,7 @@ export abstract class BaseAgent implements IAgent {
       this.log(`Agent failed: ${e}`, "error");
-      if ("response" in e && "data" in e.response) {
+      if (e != null && typeof e === "object" && "response" in e && "data" in (e as any).response) {
         this.log(
           `Error response data: ${JSON.stringify(e.response.data, null, 2)}`,
           "error"
@@ -958,6 +1068,60 @@ export abstract class BaseAgent implements IAgent {
     return JSON.stringify(messages).split(" ").length;
   }
+  /**
+   * Detects whether tool call arguments appear truncated due to hitting the output token limit.
+   * Two signals are checked:
+   *   1. Any tool call argument is empty or invalid JSON (hard truncation).
+   *   2. The model reported many output tokens but the total content received (tool call
+   *      arguments plus any message text) is tiny relative to what those tokens should
+   *      represent (soft/silent truncation).
+   *
+   * Message text is counted as received output so that a long textual reply accompanied
+   * by a small, valid tool call is not mistaken for truncation.
+   *
+   * @param toolCalls The tool calls extracted from the response.
+   * @param response The completion response; `usage.completion_tokens` and the text
+   *   content of each choice's message are read from it.
+   * @returns A warning message (role "user") if truncation is detected, or null otherwise.
+   */
+  detectTruncatedToolCalls(
+    toolCalls: ToolCall[],
+    response: CompletionResponse
+  ): { role: string; content: string } | null {
+    const outputTokens: number = response?.usage?.completion_tokens || 0;
+    const totalArgLength = toolCalls.reduce(
+      (sum, tc) => sum + (tc.function?.arguments?.length || 0),
+      0
+    );
+    // Plain-text message content also consumes output tokens, so it counts as received.
+    // NOTE(review): hidden reasoning tokens, if a provider folds them into
+    // completion_tokens, are not subtracted here — confirm whether that matters.
+    const totalContentLength = (response?.choices ?? []).reduce(
+      (sum, choice) => {
+        const text = choice?.message?.content;
+        return sum + (typeof text === "string" ? text.length : 0);
+      },
+      0
+    );
+    // Percentage-based heuristic: if the received chars are less than ~10% of the
+    // expected chars (outputTokens * 4 chars/token), the output was likely truncated.
+    // Only apply when outputTokens > 1000 to avoid false positives on small responses.
+    const expectedChars = outputTokens * 4;
+    const suspiciouslySmallArgs =
+      outputTokens > 1000 &&
+      totalArgLength + totalContentLength < expectedChars * 0.1;
+    // Hard truncation: first tool call whose arguments are empty or not valid JSON
+    // (JSON.parse throws on an empty or whitespace-only string as well).
+    const malformedCall = toolCalls.find((toolCall) => {
+      try {
+        JSON.parse(toolCall.function?.arguments || "");
+        return false;
+      } catch {
+        return true;
+      }
+    });
+    // Prefer reporting the malformed call; otherwise attribute the soft signal to the
+    // first tool call. With no tool calls there is nothing to flag.
+    const flaggedCall =
+      malformedCall ?? (suspiciouslySmallArgs ? toolCalls[0] : undefined);
+    if (!flaggedCall) {
+      return null;
+    }
+    const flaggedArgs = flaggedCall.function?.arguments || "";
+    this.log(
+      `Tool call '${flaggedCall.function?.name}' has malformed/truncated arguments — likely hit output token limit (outputTokens=${outputTokens}, argLength=${flaggedArgs.length})`,
+      "warn"
+    );
+    return {
+      role: "user",
+      content:
+        "⚠️ Output limit warning: Your last tool call had incomplete or missing arguments, which usually means you exceeded the output token limit mid-response. The model reported " +
+        outputTokens +
+        " output tokens but only " +
+        totalArgLength +
+        " characters of tool call arguments were received. Please write smaller, more concise content in your tool calls. Aim for no more than 4000 tokens of output per response. Break large responses into smaller pieces if needed.",
+    };
+  }
   async getTaskBreakdown(messages: Message[]) {
     if (this.taskBreakdown) {
       return this.taskBreakdown;

package/src/agents/tools/execCommand.ts CHANGED Viewed

@@ -262,6 +262,10 @@ export const execCommand = async (
   continueInBackground?: boolean,
   logFileName?: string
 ): Promise<string> => {
+  if(!command || typeof command !== "string") {
+    throw new Error("Invalid command. We received a non-string value. Please ensure you are sending strings of 4k tokens or less.");
+  }
   const { stdout, stderr, timedOut, killed, pid, logPath } =
     await execWithTimeout(command, {
       timeout,

package/src/agents/tools/executeScript/definition.ts CHANGED Viewed

@@ -53,7 +53,7 @@ export const executeScriptDefinition: Tool = {
       properties: {
         script: {
           type: "string",
-          description: "The TypeScript code to execute",
+          description: "The TypeScript code to execute. 4000 tokens or less",
         },
         maxToolCalls: {
           type: "number",

package/src/agents/tools/index.ts CHANGED Viewed

@@ -19,7 +19,6 @@ export * from "./language";
 export * from "./askHuman";
 export * from "./aiClient";
 export * from "./googleSearch";
-export * from "./loadWebpage";
 export * from "./stringReplace";
 export * from "./executeScript";
 export * from "./startAgentTask";

package/src/agents/tools/list.ts CHANGED Viewed

@@ -55,7 +55,7 @@ export const includedTools = [
         properties: {
           command: {
             type: "string",
-            description: "The command to execute",
+            description: "The command to execute. 4000 tokens or less",
           },
           timeout: {
             type: "number",
@@ -346,7 +346,7 @@ export const includedTools = [
     function: {
       name: "writeFileChunk",
       description:
-        "Update or create files by writing in small chunks of text. Suitable for larger files, this tool allows incremental writing by calling it multiple times.",
+        "Update or create files by writing in small chunks of text. Suitable for larger files, this tool allows incremental writing by calling it multiple times. Write chunks of around 4000 tokens",
       parameters: {
         type: "object",
         positional: true,
@@ -358,7 +358,7 @@ export const includedTools = [
           },
           content: {
             type: "string",
-            description: "The chunk of content to write to the file",
+            description: "The chunk of content to write to the file. 4000 tokens or less",
           },
           isContinuing: {
             type: "boolean",
@@ -631,46 +631,6 @@ export const includedTools = [
       },
     },
   },
-  {
-    type: "function",
-    function: {
-      name: "loadWebpage",
-      description:
-        "Load a webpage using a stealth browser to avoid bot detection. Can return either text content with console logs or a screenshot.",
-      parameters: {
-        type: "object",
-        positional: true,
-        properties: {
-          url: {
-            type: "string",
-            description: "The URL of the webpage to load",
-          },
-          mode: {
-            type: "string",
-            description:
-              "The mode for content extraction: 'text' for text content with console logs, 'screenshot' for a base64 encoded screenshot",
-            enum: ["text", "screenshot"],
-          },
-          waitForSelector: {
-            type: "string",
-            description:
-              "Optional CSS selector to wait for before extracting content",
-          },
-          timeout: {
-            type: "number",
-            description:
-              "Timeout in milliseconds for page loading (default: 30000)",
-          },
-        },
-        required: ["url"],
-      },
-      returns: {
-        type: "string",
-        description:
-          "The webpage content as text with console logs, or a base64 encoded screenshot",
-      },
-    },
-  },
   {
     type: "function",
     function: {

package/src/agents/tools/writeFile.ts CHANGED Viewed

@@ -28,7 +28,7 @@ export async function writeFileChunk(
       `File path and content are both required. We received: ${JSON.stringify({
         filePath,
         content,
-      })}. Make sure you write small chunks of content, otherwise you will hit output limits, resulting in content being empty.`
+      })}. Make sure you write small chunks of content (4k tokens), otherwise you will hit output limits, resulting in content being empty.`
     );
   }

package/src/auth/browserLogin.ts CHANGED Viewed

@@ -26,7 +26,7 @@ interface RetrieveTokenResponse {
 export class BrowserLoginService {
   private baseUrl: string;
-  constructor(baseUrl: string = KNOWHOW_API_URL) {
+  constructor(baseUrl: string = KNOWHOW_API_URL, private orgId?: string) {
     if (!baseUrl) {
       throw new BrowserLoginError(
         "KNOWHOW_API_URL environment variable not set"
@@ -52,11 +52,16 @@ export class BrowserLoginService {
       spinner.start("Opening browser for authentication");
       // Step 2: Open browser
-      await openBrowser(sessionData.browserUrl);
+      let browserUrl = sessionData.browserUrl;
+      // Append orgId as query string so the frontend can pre-select the correct organization
+      if (this.orgId) {
+        const separator = browserUrl.includes("?") ? "&" : "?";
+        browserUrl = `${browserUrl}${separator}orgId=${encodeURIComponent(this.orgId)}`;
+      }
+      await openBrowser(browserUrl);
       console.log(
-        `\nIf the browser didn't open automatically, please visit: ${sessionData.browserUrl}\n`
+        `\nIf the browser didn't open automatically, please visit: ${browserUrl}\n`
       );
       spinner.stop();
       spinner.start("Waiting for browser authentication");

package/src/chat/modules/RemoteSyncModule.ts CHANGED Viewed

@@ -247,6 +247,9 @@ export class RemoteSyncModule extends BaseChatModule {
     const registry = this.agentModule.getTaskRegistry();
     const taskInfo = registry.get(taskId);
+    // Refresh JWT in case it was updated since client was instantiated (e.g. after knowhow login)
+    this.client.refreshJwt();
     if (!taskInfo) {
       console.log(
         `⚠️  Task "${taskId}" not found in registry.`

package/src/cli.ts CHANGED Viewed

@@ -14,9 +14,10 @@ import { includedTools } from "./agents/tools/list";
 import * as allTools from "./agents/tools";
 import { LazyToolsService, services } from "./services";
 import { login } from "./login";
-import { worker } from "./worker";
+import { worker, tunnel } from "./worker";
 import { fileSync } from "./fileSync";
 import { KnowhowSimpleClient } from "./services/KnowhowClient";
+import { ModulesService } from "./services/modules";
 import {
   startAllWorkers,
   listWorkerPaths,
@@ -56,6 +57,7 @@ async function setupServices() {
   const { Agents, Mcp, Clients, Tools: OldTools } = services();
   const Tools = new LazyToolsService(); // eslint-disable-line no-shadow
+  // Load modules from config first so module-provided tools/agents/plugins are available
   // We need to wireup the LazyTools to be connected to the same singletons that are in services()
   Tools.setContext({
     ...OldTools.getContext(),
@@ -100,6 +102,19 @@ async function setupServices() {
   await Clients.registerConfiguredModels();
   console.log("✓ Services are set up and ready to go!");
+  // Load modules (tools, plugins, agents) from knowhow.json config
+  console.log("📦 Loading modules from config...");
+  const modulesService = new ModulesService();
+  await modulesService.loadModulesFromConfig({
+    Agents,
+    Embeddings: services().Embeddings,
+    Plugins: services().Plugins,
+    Clients,
+    // Use LazyToolsService so module-provided tools are visible to agents and scripts
+    Tools: Tools as any,
+    MediaProcessor: services().MediaProcessor,
+  });
   // Return both LazyToolsService (for agents) and OldTools (plain ToolsService with all tools for scripts)
   return { Tools, Clients, PlainTools: OldTools };
 }
@@ -527,6 +542,21 @@ async function main() {
       }
     });
+  program
+    .command("tunnel")
+    .description(
+      "Start tunnel-only mode: expose local ports to the cloud without registering any tools"
+    )
+    .option(
+      "--share",
+      "Share this tunnel with your organization (allows other users to use it)"
+    )
+    .option("--unshare", "Make this tunnel private (only you can use it)")
+    .action(async (options) => {
+      await tunnel(options);
+    });
   program
     .command("script")
     .description("Run a local tool script file using the executeScript sandbox")

package/src/clients/anthropic.ts CHANGED Viewed

@@ -207,7 +207,7 @@ export class GenericAnthropicClient implements GenericClient {
     const toolCalls = messages.flatMap((msg) => msg.tool_calls || []);
     const claudeMessages: MessageParam[] = messages
       .filter((msg) => msg.role !== "system")
-      .filter((msg) => msg.content)
+      .filter((msg) => msg.content || msg.role === "tool")
       .map((msg) => {
         if (msg.role === "tool") {
           const toolCall = toolCalls.find((tc) => tc.id === msg.tool_call_id);
@@ -412,7 +412,13 @@ export class GenericAnthropicClient implements GenericClient {
         }),
         model: options.model,
-        usage: response.usage,
+        usage: response.usage ? {
+          prompt_tokens: response.usage.input_tokens ?? 0,
+          completion_tokens: response.usage.output_tokens ?? 0,
+          total_tokens: (response.usage.input_tokens ?? 0) + (response.usage.output_tokens ?? 0),
+          cache_creation_input_tokens: response.usage.cache_creation_input_tokens ?? 0,
+          cache_read_input_tokens: response.usage.cache_read_input_tokens ?? 0,
+        } : undefined,
         usd_cost: this.calculateCost(options.model, response.usage),
       };
     } catch (err) {

package/src/clients/cerebras.ts ADDED Viewed

@@ -0,0 +1,10 @@
+import { HttpClient } from "./http";
+import { CerebrasTextPricing } from "./pricing/cerebras";
+/**
+ * Cerebras client built on the shared HttpClient.
+ * Sends requests to https://api.cerebras.ai and prices them with
+ * CerebrasTextPricing.
+ * Set env var CEREBRAS_API_KEY to enable, or pass the key explicitly.
+ */
+export class GenericCerebrasClient extends HttpClient {
+  /**
+   * @param apiKey Cerebras API key. Defaults to env var CEREBRAS_API_KEY so the
+   *   constructor matches the DeepSeek / Fireworks / Copilot clients; existing
+   *   callers that pass a string are unaffected.
+   */
+  constructor(apiKey = process.env.CEREBRAS_API_KEY) {
+    super("https://api.cerebras.ai");
+    // Only hand a credential to setJwt when one exists; a missing or empty key
+    // leaves the client constructed but without a JWT set.
+    if (apiKey) this.setJwt(apiKey);
+    this.setPrices(CerebrasTextPricing);
+  }
+}

package/src/clients/contextLimits.ts CHANGED Viewed

@@ -19,8 +19,8 @@ export const ContextLimits: Record<string, number> = {
   [Models.openai.GPT_5]: 1_000_000,
   [Models.openai.GPT_5_Mini]: 1_000_000,
   [Models.openai.GPT_5_Nano]: 1_000_000,
-  [Models.openai.GPT_5_1]: 1_000_000,
-  [Models.openai.GPT_5_2]: 1_000_000,
+  [Models.openai.GPT_51]: 1_000_000,
+  [Models.openai.GPT_52]: 1_000_000,
   [Models.openai.GPT_41]: 1_047_576,
   [Models.openai.GPT_41_Mini]: 1_047_576,
   [Models.openai.GPT_41_Nano]: 1_047_576,
@@ -43,6 +43,7 @@ export const ContextLimits: Record<string, number> = {
   // ─── Anthropic ────────────────────────────────────────────────────────────
   [Models.anthropic.Opus4_6]: 1_000_000,
+  [Models.anthropic.Opus4_6Fast]: 1_000_000,
   [Models.anthropic.Sonnet4_6]: 1_000_000,
   [Models.anthropic.Opus4_5]: 1_000_000,
   [Models.anthropic.Opus4]: 200_000,
@@ -54,6 +55,7 @@ export const ContextLimits: Record<string, number> = {
   [Models.anthropic.Sonnet3_5]: 200_000,
   [Models.anthropic.Opus3]: 200_000,
   [Models.anthropic.Haiku3]: 200_000,
+  [Models.anthropic.Haiku3_5]: 200_000,
   // ─── Google ───────────────────────────────────────────────────────────────
   [Models.google.Gemini_31_Pro_Preview]: 1_000_000,
@@ -82,6 +84,9 @@ export const ContextLimits: Record<string, number> = {
   // ─── xAI ──────────────────────────────────────────────────────────────────
   [Models.xai.Grok4_1_Fast_Reasoning]: 2_000_000,
   [Models.xai.Grok4_1_Fast_NonReasoning]: 2_000_000,
+  [Models.xai.Grok_4_20_Reasoning]: 131_072,
+  [Models.xai.Grok_4_20_NonReasoning]: 131_072,
+  [Models.xai.Grok_4_20_MultiAgent]: 2_000_000,
   [Models.xai.GrokCodeFast]: 2_000_000,
   [Models.xai.Grok4]: 131_072,
   [Models.xai.Grok3Beta]: 131_072,

package/src/clients/copilot.ts ADDED Viewed

@@ -0,0 +1,23 @@
+import { HttpClient } from "./http";
+import { CopilotTextPricing } from "./pricing/copilot";
+/**
+ * Client for GitHub Copilot's OpenAI-compatible API.
+ * Model list: https://docs.github.com/en/copilot/reference/ai-models/supported-models
+ *
+ * Requests go to https://api.githubcopilot.com, where Copilot subscribers can
+ * reach premium models (Claude Opus, GPT-5.x, Gemini, Grok, etc.). Usage is
+ * drawn from the subscription's premium request allowance rather than billed
+ * per token.
+ *
+ * Auth: a GitHub token — the same kind as GITHUB_TOKEN, i.e. a personal access
+ * token or an OAuth token with copilot scope.
+ *
+ * Enable by setting env var GITHUB_COPILOT_TOKEN (preferred) or GITHUB_TOKEN.
+ */
+export class GitHubCopilotClient extends HttpClient {
+  /**
+   * @param apiKey GitHub token. Defaults to GITHUB_COPILOT_TOKEN; GITHUB_TOKEN
+   *   is consulted only when GITHUB_COPILOT_TOKEN is null/undefined (`??`),
+   *   not when it is set to an empty string.
+   */
+  constructor(
+    apiKey = process.env.GITHUB_COPILOT_TOKEN ?? process.env.GITHUB_TOKEN
+  ) {
+    super("https://api.githubcopilot.com");
+    // A missing or empty token skips setJwt; the client is still constructed.
+    if (apiKey) {
+      this.setJwt(apiKey);
+    }
+    this.setPrices(CopilotTextPricing);
+  }
+}

package/src/clients/deepseek.ts ADDED Viewed

@@ -0,0 +1,16 @@
+import { HttpClient } from "./http";
+import { DeepSeekTextPricing } from "./pricing/deepseek";
+/**
+ * Client for DeepSeek's OpenAI-compatible API.
+ * API docs: https://platform.deepseek.com/api-docs/
+ * Offers industry-leading reasoning (R1) and coding (V3) models at very low cost.
+ * Enable by setting env var DEEPSEEK_API_KEY.
+ */
+export class GenericDeepSeekClient extends HttpClient {
+  /**
+   * @param apiKey DeepSeek API key; defaults to env var DEEPSEEK_API_KEY.
+   */
+  constructor(apiKey = process.env.DEEPSEEK_API_KEY) {
+    super("https://api.deepseek.com");
+    // A missing or empty key skips setJwt; the client is still constructed.
+    if (apiKey) {
+      this.setJwt(apiKey);
+    }
+    this.setPrices(DeepSeekTextPricing);
+  }
+}

package/src/clients/fireworks.ts ADDED Viewed

@@ -0,0 +1,15 @@
+import { HttpClient } from "./http";
+import { FireworksTextPricing } from "./pricing/fireworks";
+/**
+ * Client for the Fireworks AI OpenAI-compatible API (fast serverless inference).
+ * API docs: https://docs.fireworks.ai/api-reference/introduction
+ * Enable by setting env var FIREWORKS_API_KEY.
+ */
+export class GenericFireworksClient extends HttpClient {
+  /**
+   * @param apiKey Fireworks API key; defaults to env var FIREWORKS_API_KEY.
+   */
+  constructor(apiKey = process.env.FIREWORKS_API_KEY) {
+    super("https://api.fireworks.ai/inference");
+    // A missing or empty key skips setJwt; the client is still constructed.
+    if (apiKey) {
+      this.setJwt(apiKey);
+    }
+    this.setPrices(FireworksTextPricing);
+  }
+}