npm - @ztimson/ai-utils - Versions diffs - 0.6.3 → 0.6.5 - Mend

@ztimson/ai-utils 0.6.3 → 0.6.5

This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/dist/index.mjs CHANGED Viewed

@@ -1,21 +1,23 @@
-import * as j from "node:os";
-import { objectMap as k, JSONAttemptParse as g, findByProp as x, JSONSanitize as b, clean as T, Http as P, consoleInterceptor as q, fn as $, ASet as M } from "@ztimson/utils";
-import { Anthropic as E } from "@anthropic-ai/sdk";
-import { OpenAI as O } from "openai";
-import { Worker as A } from "worker_threads";
-import { fileURLToPath as R } from "url";
-import { join as v, dirname as U } from "path";
-import { spawn as w } from "node:child_process";
-import { pipeline as z, read_audio as L } from "@xenova/transformers";
-import { createWorker as N } from "tesseract.js";
+import * as P from "node:os";
+import { objectMap as x, JSONAttemptParse as b, findByProp as S, JSONSanitize as w, clean as q, Http as $, consoleInterceptor as M, fn as E, ASet as A } from "@ztimson/utils";
+import { Anthropic as O } from "@anthropic-ai/sdk";
+import { OpenAI as v } from "openai";
+import { Worker as R } from "worker_threads";
+import { fileURLToPath as U } from "url";
+import { join as z, dirname as L } from "path";
+import { spawn as k } from "node:child_process";
+import { pipeline as N } from "@xenova/transformers";
+import * as W from "node:fs";
+import C from "wavefile";
+import { createWorker as D } from "tesseract.js";
 import "./embedder.mjs";
-import * as C from "cheerio";
-import { $ as W, $Sync as D } from "@ztimson/node-utils";
-class S {
+import * as I from "cheerio";
+import { $ as F, $Sync as H } from "@ztimson/node-utils";
+class j {
 }
-class I extends S {
+class J extends j {
   constructor(r, e, t) {
-    super(), this.ai = r, this.apiToken = e, this.model = t, this.client = new E({ apiKey: e });
+    super(), this.ai = r, this.apiToken = e, this.model = t, this.client = new O({ apiKey: e });
   }
   client;
   toStandard(r) {
@@ -24,15 +26,15 @@ class I extends S {
       if (typeof i.content == "string")
         t.push({ timestamp: e, ...i });
       else {
-        const n = i.content?.filter((s) => s.type == "text").map((s) => s.text).join(`
+        const s = i.content?.filter((n) => n.type == "text").map((n) => n.text).join(`
 `);
-        n && t.push({ timestamp: e, role: i.role, content: n }), i.content.forEach((s) => {
-          if (s.type == "tool_use")
-            t.push({ timestamp: e, role: "tool", id: s.id, name: s.name, args: s.input, content: void 0 });
-          else if (s.type == "tool_result") {
-            const o = t.findLast((a) => a.id == s.tool_use_id);
-            o && (o[s.is_error ? "error" : "content"] = s.content);
+        s && t.push({ timestamp: e, role: i.role, content: s }), i.content.forEach((n) => {
+          if (n.type == "tool_use")
+            t.push({ timestamp: e, role: "tool", id: n.id, name: n.name, args: n.input, content: void 0 });
+          else if (n.type == "tool_result") {
+            const o = t.findLast((a) => a.id == n.tool_use_id);
+            o && (o[n.is_error ? "error" : "content"] = n.content);
           }
         });
       }
@@ -54,34 +56,34 @@ class I extends S {
   ask(r, e = {}) {
     const t = new AbortController();
     return Object.assign(new Promise(async (i) => {
-      let n = this.fromStandard([...e.history || [], { role: "user", content: r, timestamp: Date.now() }]);
-      const s = e.tools || this.ai.options.llm?.tools || [], o = {
+      let s = this.fromStandard([...e.history || [], { role: "user", content: r, timestamp: Date.now() }]);
+      const n = e.tools || this.ai.options.llm?.tools || [], o = {
         model: e.model || this.model,
         max_tokens: e.max_tokens || this.ai.options.llm?.max_tokens || 4096,
         system: e.system || this.ai.options.llm?.system || "",
         temperature: e.temperature || this.ai.options.llm?.temperature || 0.7,
-        tools: s.map((d) => ({
+        tools: n.map((d) => ({
           name: d.name,
           description: d.description,
           input_schema: {
             type: "object",
-            properties: d.args ? k(d.args, (c, m) => ({ ...m, required: void 0 })) : {},
+            properties: d.args ? x(d.args, (c, l) => ({ ...l, required: void 0 })) : {},
             required: d.args ? Object.entries(d.args).filter((c) => c[1].required).map((c) => c[0]) : []
           },
           fn: void 0
         })),
-        messages: n,
+        messages: s,
         stream: !!e.stream
       };
-      let a, l = !0;
+      let a, m = !0;
       do {
         if (a = await this.client.messages.create(o).catch((c) => {
           throw c.message += `
 Messages:
-${JSON.stringify(n, null, 2)}`, c;
+${JSON.stringify(s, null, 2)}`, c;
         }), e.stream) {
-          l ? l = !1 : e.stream({ text: `
+          m ? m = !1 : e.stream({ text: `
 ` }), a.content = [];
           for await (const c of a) {
@@ -90,41 +92,41 @@ ${JSON.stringify(n, null, 2)}`, c;
               c.content_block.type === "text" ? a.content.push({ type: "text", text: "" }) : c.content_block.type === "tool_use" && a.content.push({ type: "tool_use", id: c.content_block.id, name: c.content_block.name, input: "" });
             else if (c.type === "content_block_delta")
               if (c.delta.type === "text_delta") {
-                const m = c.delta.text;
-                a.content.at(-1).text += m, e.stream({ text: m });
+                const l = c.delta.text;
+                a.content.at(-1).text += l, e.stream({ text: l });
               } else c.delta.type === "input_json_delta" && (a.content.at(-1).input += c.delta.partial_json);
             else if (c.type === "content_block_stop") {
-              const m = a.content.at(-1);
-              m.input != null && (m.input = m.input ? g(m.input, {}) : {});
+              const l = a.content.at(-1);
+              l.input != null && (l.input = l.input ? b(l.input, {}) : {});
             } else if (c.type === "message_stop")
               break;
           }
         }
         const d = a.content.filter((c) => c.type === "tool_use");
         if (d.length && !t.signal.aborted) {
-          n.push({ role: "assistant", content: a.content });
-          const c = await Promise.all(d.map(async (m) => {
-            const h = s.find(x("name", m.name));
-            if (e.stream && e.stream({ tool: m.name }), !h) return { tool_use_id: m.id, is_error: !0, content: "Tool not found" };
+          s.push({ role: "assistant", content: a.content });
+          const c = await Promise.all(d.map(async (l) => {
+            const h = n.find(S("name", l.name));
+            if (e.stream && e.stream({ tool: l.name }), !h) return { tool_use_id: l.id, is_error: !0, content: "Tool not found" };
             try {
-              const u = await h.fn(m.input, e?.stream, this.ai);
-              return { type: "tool_result", tool_use_id: m.id, content: b(u) };
+              const u = await h.fn(l.input, e?.stream, this.ai);
+              return { type: "tool_result", tool_use_id: l.id, content: w(u) };
             } catch (u) {
-              return { type: "tool_result", tool_use_id: m.id, is_error: !0, content: u?.message || u?.toString() || "Unknown" };
+              return { type: "tool_result", tool_use_id: l.id, is_error: !0, content: u?.message || u?.toString() || "Unknown" };
             }
           }));
-          n.push({ role: "user", content: c }), o.messages = n;
+          s.push({ role: "user", content: c }), o.messages = s;
         }
       } while (!t.signal.aborted && a.content.some((d) => d.type === "tool_use"));
-      n.push({ role: "assistant", content: a.content.filter((d) => d.type == "text").map((d) => d.text).join(`
+      s.push({ role: "assistant", content: a.content.filter((d) => d.type == "text").map((d) => d.text).join(`
-`) }), n = this.toStandard(n), e.stream && e.stream({ done: !0 }), e.history && e.history.splice(0, e.history.length, ...n), i(n.at(-1)?.content);
+`) }), s = this.toStandard(s), e.stream && e.stream({ done: !0 }), e.history && e.history.splice(0, e.history.length, ...s), i(s.at(-1)?.content);
     }), { abort: () => t.abort() });
   }
 }
-class _ extends S {
+class _ extends j {
   constructor(r, e, t, i) {
-    super(), this.ai = r, this.host = e, this.token = t, this.model = i, this.client = new O(T({
+    super(), this.ai = r, this.host = e, this.token = t, this.model = i, this.client = new v(q({
       baseURL: e,
       apiKey: t
     }));
@@ -134,16 +136,16 @@ class _ extends S {
     for (let e = 0; e < r.length; e++) {
       const t = r[e];
       if (t.role === "assistant" && t.tool_calls) {
-        const i = t.tool_calls.map((n) => ({
+        const i = t.tool_calls.map((s) => ({
           role: "tool",
-          id: n.id,
-          name: n.function.name,
-          args: g(n.function.arguments, {}),
+          id: s.id,
+          name: s.function.name,
+          args: b(s.function.arguments, {}),
           timestamp: t.timestamp
         }));
         r.splice(e, 1, ...i), e += i.length - 1;
       } else if (t.role === "tool" && t.content) {
-        const i = r.find((n) => t.tool_call_id == n.id);
+        const i = r.find((s) => t.tool_call_id == s.id);
         i && (t.content.includes('"error":') ? i.error = t.content : i.content = t.content), r.splice(e, 1), e--;
       }
       r[e]?.timestamp || (r[e].timestamp = Date.now());
@@ -165,20 +167,20 @@ class _ extends S {
           content: t.error || t.content
         });
       else {
-        const { timestamp: i, ...n } = t;
-        e.push(n);
+        const { timestamp: i, ...s } = t;
+        e.push(s);
       }
       return e;
     }, []);
   }
   ask(r, e = {}) {
     const t = new AbortController();
-    return Object.assign(new Promise(async (i, n) => {
+    return Object.assign(new Promise(async (i, s) => {
       e.system && e.history?.[0]?.role != "system" && e.history?.splice(0, 0, { role: "system", content: e.system, timestamp: Date.now() });
-      let s = this.fromStandard([...e.history || [], { role: "user", content: r, timestamp: Date.now() }]);
+      let n = this.fromStandard([...e.history || [], { role: "user", content: r, timestamp: Date.now() }]);
       const o = e.tools || this.ai.options.llm?.tools || [], a = {
         model: e.model || this.model,
-        messages: s,
+        messages: n,
         stream: !!e.stream,
         max_tokens: e.max_tokens || this.ai.options.llm?.max_tokens || 4096,
         temperature: e.temperature || this.ai.options.llm?.temperature || 0.7,
@@ -189,55 +191,55 @@ class _ extends S {
             description: c.description,
             parameters: {
               type: "object",
-              properties: c.args ? k(c.args, (m, h) => ({ ...h, required: void 0 })) : {},
-              required: c.args ? Object.entries(c.args).filter((m) => m[1].required).map((m) => m[0]) : []
+              properties: c.args ? x(c.args, (l, h) => ({ ...h, required: void 0 })) : {},
+              required: c.args ? Object.entries(c.args).filter((l) => l[1].required).map((l) => l[0]) : []
             }
           }
         }))
       };
-      let l, d = !0;
+      let m, d = !0;
       do {
-        if (l = await this.client.chat.completions.create(a).catch((m) => {
-          throw m.message += `
+        if (m = await this.client.chat.completions.create(a).catch((l) => {
+          throw l.message += `
 Messages:
-${JSON.stringify(s, null, 2)}`, m;
+${JSON.stringify(n, null, 2)}`, l;
         }), e.stream) {
           d ? d = !1 : e.stream({ text: `
-` }), l.choices = [{ message: { content: "", tool_calls: [] } }];
-          for await (const m of l) {
+` }), m.choices = [{ message: { content: "", tool_calls: [] } }];
+          for await (const l of m) {
             if (t.signal.aborted) break;
-            m.choices[0].delta.content && (l.choices[0].message.content += m.choices[0].delta.content, e.stream({ text: m.choices[0].delta.content })), m.choices[0].delta.tool_calls && (l.choices[0].message.tool_calls = m.choices[0].delta.tool_calls);
+            l.choices[0].delta.content && (m.choices[0].message.content += l.choices[0].delta.content, e.stream({ text: l.choices[0].delta.content })), l.choices[0].delta.tool_calls && (m.choices[0].message.tool_calls = l.choices[0].delta.tool_calls);
           }
         }
-        const c = l.choices[0].message.tool_calls || [];
+        const c = m.choices[0].message.tool_calls || [];
         if (c.length && !t.signal.aborted) {
-          s.push(l.choices[0].message);
-          const m = await Promise.all(c.map(async (h) => {
-            const u = o?.find(x("name", h.function.name));
+          n.push(m.choices[0].message);
+          const l = await Promise.all(c.map(async (h) => {
+            const u = o?.find(S("name", h.function.name));
             if (e.stream && e.stream({ tool: h.function.name }), !u) return { role: "tool", tool_call_id: h.id, content: '{"error": "Tool not found"}' };
             try {
-              const f = g(h.function.arguments, {}), y = await u.fn(f, e.stream, this.ai);
-              return { role: "tool", tool_call_id: h.id, content: b(y) };
+              const f = b(h.function.arguments, {}), y = await u.fn(f, e.stream, this.ai);
+              return { role: "tool", tool_call_id: h.id, content: w(y) };
             } catch (f) {
-              return { role: "tool", tool_call_id: h.id, content: b({ error: f?.message || f?.toString() || "Unknown" }) };
+              return { role: "tool", tool_call_id: h.id, content: w({ error: f?.message || f?.toString() || "Unknown" }) };
             }
           }));
-          s.push(...m), a.messages = s;
+          n.push(...l), a.messages = n;
         }
-      } while (!t.signal.aborted && l.choices?.[0]?.message?.tool_calls?.length);
-      s.push({ role: "assistant", content: l.choices[0].message.content || "" }), s = this.toStandard(s), e.stream && e.stream({ done: !0 }), e.history && e.history.splice(0, e.history.length, ...s), i(s.at(-1)?.content);
+      } while (!t.signal.aborted && m.choices?.[0]?.message?.tool_calls?.length);
+      n.push({ role: "assistant", content: m.choices[0].message.content || "" }), n = this.toStandard(n), e.stream && e.stream({ done: !0 }), e.history && e.history.splice(0, e.history.length, ...n), i(n.at(-1)?.content);
     }), { abort: () => t.abort() });
   }
 }
-class H {
+class B {
   constructor(r) {
-    this.ai = r, this.embedWorker = new A(v(U(R(import.meta.url)), "embedder.js")), this.embedWorker.on("message", ({ id: e, embedding: t }) => {
+    this.ai = r, this.embedWorker = new R(z(L(U(import.meta.url)), "embedder.js")), this.embedWorker.on("message", ({ id: e, embedding: t }) => {
       const i = this.embedQueue.get(e);
       i && (i.resolve(t), this.embedQueue.delete(e));
     }), r.options.llm?.models && Object.entries(r.options.llm.models).forEach(([e, t]) => {
-      this.defaultModel || (this.defaultModel = e), t.proto == "anthropic" ? this.models[e] = new I(this.ai, t.token, e) : t.proto == "ollama" ? this.models[e] = new _(this.ai, t.host, "not-needed", e) : t.proto == "openai" && (this.models[e] = new _(this.ai, t.host || null, t.token, e));
+      this.defaultModel || (this.defaultModel = e), t.proto == "anthropic" ? this.models[e] = new J(this.ai, t.token, e) : t.proto == "ollama" ? this.models[e] = new _(this.ai, t.host, "not-needed", e) : t.proto == "openai" && (this.models[e] = new _(this.ai, t.host || null, t.token, e));
     });
   }
   embedWorker = null;
@@ -256,20 +258,20 @@ class H {
     if (!this.models[t]) throw new Error(`Model does not exist: ${t}`);
     let i = () => {
     };
-    return Object.assign(new Promise(async (n) => {
+    return Object.assign(new Promise(async (s) => {
       if (e.history || (e.history = []), e.memory) {
         e.system = (e.system || "") + `
 You have passive persistent memory never make any mention of your memory capabilities and what you can/cannot remember
 `;
-        const o = async (l, d, c = 50) => {
-          const [m, h] = await Promise.all([
+        const o = async (m, d, c = 50) => {
+          const [l, h] = await Promise.all([
             d ? this.embedding(d) : Promise.resolve(null),
-            l ? this.embedding(l) : Promise.resolve(null)
+            m ? this.embedding(m) : Promise.resolve(null)
           ]);
-          return (e.memory || []).map((u) => ({ ...u, score: m ? this.cosineSimilarity(u.embeddings[0], m[0].embedding) : 1 })).filter((u) => u.score >= 0.8).map((u) => ({ ...u, score: h ? this.cosineSimilarity(u.embeddings[1], h[0].embedding) : u.score })).filter((u) => u.score >= 0.2).toSorted((u, f) => u.score - f.score).slice(0, c);
+          return (e.memory || []).map((u) => ({ ...u, score: l ? this.cosineSimilarity(u.embeddings[0], l[0].embedding) : 1 })).filter((u) => u.score >= 0.8).map((u) => ({ ...u, score: h ? this.cosineSimilarity(u.embeddings[1], h[0].embedding) : u.score })).filter((u) => u.score >= 0.2).toSorted((u, f) => u.score - f.score).slice(0, c);
         }, a = await o(r);
         a.length && e.history.push({ role: "assistant", content: `Things I remembered:
-` + a.map((l) => `${l.owner}: ${l.fact}`).join(`
+` + a.map((m) => `${m.owner}: ${m.fact}`).join(`
 `) }), e.tools = [...e.tools || [], {
           name: "read_memory",
           description: "Check your long-term memory for more information",
@@ -278,13 +280,13 @@ You have passive persistent memory never make any mention of your memory capabil
             query: { type: "string", description: "Search memory based on a query, can be used with or without subject argument" },
             limit: { type: "number", description: "Result limit, default 5" }
           },
-          fn: (l) => {
-            if (!l.subject && !l.query) throw new Error("Either a subject or query argument is required");
-            return o(l.query, l.subject, l.limit || 5);
+          fn: (m) => {
+            if (!m.subject && !m.query) throw new Error("Either a subject or query argument is required");
+            return o(m.query, m.subject, m.limit || 5);
           }
         }];
       }
-      const s = await this.models[t].ask(r, e);
+      const n = await this.models[t].ask(r, e);
       if (e.memory) {
         const o = e.history?.findIndex((a) => a.role == "assistant" && a.content.startsWith("Things I remembered:"));
         o != null && o >= 0 && e.history?.splice(o, 1);
@@ -294,15 +296,15 @@ You have passive persistent memory never make any mention of your memory capabil
         if (e.compress)
           o = await this.ai.language.compressHistory(e.history, e.compress.max, e.compress.min, e), e.history.splice(0, e.history.length, ...o.history);
         else {
-          const a = e.history?.findLastIndex((l) => l.role == "user") ?? -1;
+          const a = e.history?.findLastIndex((m) => m.role == "user") ?? -1;
           o = await this.ai.language.compressHistory(a != -1 ? e.history.slice(a) : e.history, 0, 0, e);
         }
         if (e.memory) {
-          const a = e.memory.filter((l) => !o.memory.some((d) => this.cosineSimilarity(l.embeddings[1], d.embeddings[1]) > 0.8)).concat(o.memory);
+          const a = e.memory.filter((m) => !o.memory.some((d) => this.cosineSimilarity(m.embeddings[1], d.embeddings[1]) > 0.8)).concat(o.memory);
           e.memory.splice(0, e.memory.length, ...a);
         }
       }
-      return n(s);
+      return s(n);
     }), { abort: i });
   }
   /**
@@ -315,20 +317,20 @@ You have passive persistent memory never make any mention of your memory capabil
    */
   async compressHistory(r, e, t, i) {
     if (this.estimateTokens(r) < e) return { history: r, memory: [] };
-    let n = 0, s = 0;
+    let s = 0, n = 0;
     for (let u of r.toReversed())
-      if (s += this.estimateTokens(u.content), s < t) n++;
+      if (n += this.estimateTokens(u.content), n < t) s++;
       else break;
-    if (r.length <= n) return { history: r, memory: [] };
-    const o = r[0].role == "system" ? r[0] : null, a = n == 0 ? [] : r.slice(-n), l = (n == 0 ? r : r.slice(0, -n)).filter((u) => u.role === "assistant" || u.role === "user"), d = await this.json(`Create the smallest summary possible, no more than 500 tokens. Create a list of NEW facts (split by subject [pro]noun and fact) about what you learned from this conversation that you didn't already know or get from a tool call or system prompt. Focus only on new information about people, topics, or facts. Avoid generating facts about the AI. Match this format: {summary: string, facts: [[subject, fact]]}
+    if (r.length <= s) return { history: r, memory: [] };
+    const o = r[0].role == "system" ? r[0] : null, a = s == 0 ? [] : r.slice(-s), m = (s == 0 ? r : r.slice(0, -s)).filter((u) => u.role === "assistant" || u.role === "user"), d = await this.json(`Create the smallest summary possible, no more than 500 tokens. Create a list of NEW facts (split by subject [pro]noun and fact) about what you learned from this conversation that you didn't already know or get from a tool call or system prompt. Focus only on new information about people, topics, or facts. Avoid generating facts about the AI. Match this format: {summary: string, facts: [[subject, fact]]}
-${l.map((u) => `${u.role}: ${u.content}`).join(`
+${m.map((u) => `${u.role}: ${u.content}`).join(`
-`)}`, { model: i?.model, temperature: i?.temperature || 0.3 }), c = /* @__PURE__ */ new Date(), m = await Promise.all((d?.facts || [])?.map(async ([u, f]) => {
+`)}`, { model: i?.model, temperature: i?.temperature || 0.3 }), c = /* @__PURE__ */ new Date(), l = await Promise.all((d?.facts || [])?.map(async ([u, f]) => {
       const y = await Promise.all([this.embedding(u), this.embedding(`${u}: ${f}`)]);
       return { owner: u, fact: f, embeddings: [y[0][0].embedding, y[1][0].embedding], timestamp: c };
     })), h = [{ role: "assistant", content: `Conversation Summary: ${d?.summary}`, timestamp: Date.now() }, ...a];
-    return o && h.splice(0, 0, o), { history: h, memory: m };
+    return o && h.splice(0, 0, o), { history: h, memory: l };
   }
   /**
    * Compare the difference between embeddings (calculates the angle between two vectors)
@@ -338,11 +340,11 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
    */
   cosineSimilarity(r, e) {
     if (r.length !== e.length) throw new Error("Vectors must be same length");
-    let t = 0, i = 0, n = 0;
+    let t = 0, i = 0, s = 0;
     for (let o = 0; o < r.length; o++)
-      t += r[o] * e[o], i += r[o] * r[o], n += e[o] * e[o];
-    const s = Math.sqrt(i) * Math.sqrt(n);
-    return s === 0 ? 0 : t / s;
+      t += r[o] * e[o], i += r[o] * r[o], s += e[o] * e[o];
+    const n = Math.sqrt(i) * Math.sqrt(s);
+    return n === 0 ? 0 : t / n;
   }
   /**
    * Chunk text into parts for AI digestion
@@ -352,21 +354,21 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
    * @returns {string[]} Chunked strings
    */
   chunk(r, e = 500, t = 50) {
-    const i = (a, l = "") => a ? Object.entries(a).flatMap(([d, c]) => {
-      const m = l ? `${l}${isNaN(+d) ? `.${d}` : `[${d}]`}` : d;
-      return typeof c == "object" && !Array.isArray(c) ? i(c, m) : `${m}: ${Array.isArray(c) ? c.join(", ") : c}`;
-    }) : [], s = (typeof r == "object" ? i(r) : r.split(`
+    const i = (a, m = "") => a ? Object.entries(a).flatMap(([d, c]) => {
+      const l = m ? `${m}${isNaN(+d) ? `.${d}` : `[${d}]`}` : d;
+      return typeof c == "object" && !Array.isArray(c) ? i(c, l) : `${l}: ${Array.isArray(c) ? c.join(", ") : c}`;
+    }) : [], n = (typeof r == "object" ? i(r) : r.split(`
 `)).flatMap((a) => [...a.split(/\s+/).filter(Boolean), `
 `]), o = [];
-    for (let a = 0; a < s.length; ) {
-      let l = "", d = a;
-      for (; d < s.length; ) {
-        const m = l + (l ? " " : "") + s[d];
-        if (this.estimateTokens(m.replace(/\s*\n\s*/g, `
-`)) > e && l) break;
-        l = m, d++;
+    for (let a = 0; a < n.length; ) {
+      let m = "", d = a;
+      for (; d < n.length; ) {
+        const l = m + (m ? " " : "") + n[d];
+        if (this.estimateTokens(l.replace(/\s*\n\s*/g, `
+`)) > e && m) break;
+        m = l, d++;
       }
-      const c = l.replace(/\s*\n\s*/g, `
+      const c = m.replace(/\s*\n\s*/g, `
 `).trim();
       c && o.push(c), a = Math.max(d - t, d === a ? a + 1 : d);
     }
@@ -380,20 +382,20 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
    * @returns {Promise<Awaited<{index: number, embedding: number[], text: string, tokens: number}>[]>} Chunked embeddings
    */
   embedding(r, e = 500, t = 50) {
-    const i = (s) => new Promise((o, a) => {
-      const l = this.embedId++;
-      this.embedQueue.set(l, { resolve: o, reject: a }), this.embedWorker?.postMessage({
-        id: l,
-        text: s,
+    const i = (n) => new Promise((o, a) => {
+      const m = this.embedId++;
+      this.embedQueue.set(m, { resolve: o, reject: a }), this.embedWorker?.postMessage({
+        id: m,
+        text: n,
         model: this.ai.options?.embedder || "bge-small-en-v1.5",
         path: this.ai.options.path
       });
-    }), n = this.chunk(r, e, t);
-    return Promise.all(n.map(async (s, o) => ({
+    }), s = this.chunk(r, e, t);
+    return Promise.all(s.map(async (n, o) => ({
       index: o,
-      embedding: await i(s),
-      text: s,
-      tokens: this.estimateTokens(s)
+      embedding: await i(n),
+      text: n,
+      tokens: this.estimateTokens(n)
     })));
   }
   /**
@@ -413,8 +415,8 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
    */
   fuzzyMatch(r, ...e) {
     if (e.length < 2) throw new Error("Requires at least 2 strings to compare");
-    const t = (s, o = 10) => s.toLowerCase().split("").map((a, l) => a.charCodeAt(0) * (l + 1) % o / o).slice(0, o), i = t(r), n = e.map((s) => t(s)).map((s) => this.cosineSimilarity(i, s));
-    return { avg: n.reduce((s, o) => s + o, 0) / n.length, max: Math.max(...n), similarities: n };
+    const t = (n, o = 10) => n.toLowerCase().split("").map((a, m) => a.charCodeAt(0) * (m + 1) % o / o).slice(0, o), i = t(r), s = e.map((n) => t(n)).map((n) => this.cosineSimilarity(i, n));
+    return { avg: s.reduce((n, o) => n + o, 0) / s.length, max: Math.max(...s), similarities: s };
   }
   /**
    * Ask a question with JSON response
@@ -425,8 +427,8 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
   async json(r, e) {
     let t = await this.ask(r, { system: "Respond using a JSON blob matching any provided examples", ...e });
     if (!t) return {};
-    const i = /```(?:.+)?\s*([\s\S]*?)```/.exec(t), n = i ? i[1].trim() : t;
-    return g(n, {});
+    const i = /```(?:.+)?\s*([\s\S]*?)```/.exec(t), s = i ? i[1].trim() : t;
+    return b(s, {});
   }
   /**
    * Create a summary of some text
@@ -439,7 +441,7 @@ ${l.map((u) => `${u.role}: ${u.content}`).join(`
     return this.ask(r, { system: `Generate a brief summary <= ${e} tokens. Output nothing else`, temperature: 0.3, ...t });
   }
 }
-class J {
+class G {
   constructor(r) {
     this.ai = r;
   }
@@ -450,17 +452,17 @@ class J {
     e.forEach((a) => {
       t.has(a.speaker) || t.set(a.speaker, ++i);
     });
-    const n = [];
-    let s = -1, o = "";
+    const s = [];
+    let n = -1, o = "";
     return r.forEach((a) => {
-      const l = a.timestamp[0], d = e.find((m) => l >= m.start && l <= m.end), c = d ? t.get(d.speaker) : 1;
-      c !== s ? (o && n.push(`[speaker ${s}]: ${o.trim()}`), s = c, o = a.text) : o += a.text;
-    }), o && n.push(`[speaker ${s}]: ${o.trim()}`), n.join(`
+      const m = a.timestamp[0], d = e.find((l) => m >= l.start && m <= l.end), c = d ? t.get(d.speaker) : 1;
+      c !== n ? (o && s.push(`[speaker ${n}]: ${o.trim()}`), n = c, o = a.text) : o += a.text;
+    }), o && s.push(`[speaker ${n}]: ${o.trim()}`), s.join(`
 `);
   }
   async canDiarization() {
     return new Promise((r) => {
-      const e = w("python3", ["-c", "import pyannote.audio"]);
+      const e = k("python3", ["-c", "import pyannote.audio"]);
       e.on("close", (t) => r(t === 0)), e.on("error", () => r(!1));
     });
   }
@@ -486,43 +488,54 @@ for turn, _, speaker in diarization.itertracks(yield_label=True):
 print(json.dumps(segments))
 `;
     return new Promise((t, i) => {
-      let n = "";
-      const s = w("python3", ["-c", e, r]);
-      s.stdout.on("data", (o) => n += o.toString()), s.stderr.on("data", (o) => console.error(o.toString())), s.on("close", (o) => {
+      let s = "";
+      const n = k("python3", ["-c", e, r]);
+      n.stdout.on("data", (o) => s += o.toString()), n.stderr.on("data", (o) => console.error(o.toString())), n.on("close", (o) => {
         if (o === 0)
           try {
-            t(JSON.parse(n));
+            t(JSON.parse(s));
           } catch {
             i(new Error("Failed to parse diarization output"));
           }
         else
           i(new Error(`Python process exited with code ${o}`));
-      }), s.on("error", i);
+      }), n.on("error", i);
     });
   }
   asr(r, e = {}) {
     const { model: t = this.ai.options.asr || "whisper-base", speaker: i = !1 } = e;
-    let n = !1;
-    const s = () => {
-      n = !0;
-    }, o = new Promise(async (a, l) => {
+    let s = !1;
+    const n = () => {
+      s = !0;
+    }, o = new Promise(async (a, m) => {
       try {
-        if (n || (this.whisperPipeline || (this.whisperPipeline = await z("automatic-speech-recognition", `Xenova/${t}`, { cache_dir: this.ai.options.path, quantized: !0 })), n)) return a(null);
-        const d = await L(r, 16e3), c = await this.whisperPipeline(d, { return_timestamps: i ? "word" : !1, chunk_length_s: 30 });
-        if (!i) return a(c.text?.trim() || null);
-        if (n) return a(null);
-        const m = await this.runDiarization(r);
-        if (n) return a(null);
-        const h = this.combineSpeakerTranscript(c.chunks || [], m);
-        a(h);
+        if (s || (this.whisperPipeline || (this.whisperPipeline = await N("automatic-speech-recognition", `Xenova/${t}`, { cache_dir: this.ai.options.path, quantized: !0 })), s)) return a(null);
+        const d = new C.WaveFile(W.readFileSync(r));
+        d.toBitDepth("32f"), d.toSampleRate(16e3);
+        const c = d.getSamples();
+        let l;
+        if (Array.isArray(c)) {
+          const y = c[0], T = c[1];
+          l = new Float32Array(y.length);
+          for (let g = 0; g < y.length; g++) l[g] = (y[g] + T[g]) / 2;
+        } else
+          l = c;
+        if (s) return a(null);
+        const h = await this.whisperPipeline(l, { return_timestamps: i ? "word" : !1 });
+        if (!i) return a(h.text?.trim() || null);
+        if (s) return a(null);
+        const u = await this.runDiarization(r);
+        if (s) return a(null);
+        const f = this.combineSpeakerTranscript(h.chunks || [], u);
+        a(f);
       } catch (d) {
-        l(d);
+        m(d);
       }
     });
-    return Object.assign(o, { abort: s });
+    return Object.assign(o, { abort: n });
   }
 }
-class F {
+class Q {
   constructor(r) {
     this.ai = r;
   }
@@ -534,16 +547,16 @@ class F {
   ocr(r) {
     let e;
     const t = new Promise(async (i) => {
-      e = await N(this.ai.options.ocr || "eng", 2, { cachePath: this.ai.options.path });
-      const { data: n } = await e.recognize(r);
-      await e.terminate(), i(n.text.trim() || null);
+      e = await D(this.ai.options.ocr || "eng", 2, { cachePath: this.ai.options.path });
+      const { data: s } = await e.recognize(r);
+      await e.terminate(), i(s.text.trim() || null);
     });
     return Object.assign(t, { abort: () => e?.terminate() });
   }
 }
-class ie {
+class me {
   constructor(r) {
-    this.options = r, r.path || (r.path = j.tmpdir()), process.env.TRANSFORMERS_CACHE = r.path, this.audio = new J(this), this.language = new H(this), this.vision = new F(this);
+    this.options = r, r.path || (r.path = P.tmpdir()), process.env.TRANSFORMERS_CACHE = r.path, this.audio = new G(this), this.language = new B(this), this.vision = new Q(this);
   }
   /** Audio processing AI */
   audio;
@@ -552,17 +565,17 @@ class ie {
   /** Vision processing AI */
   vision;
 }
-const G = {
+const K = {
   name: "cli",
   description: "Use the command line interface, returns any output",
   args: { command: { type: "string", description: "Command to run", required: !0 } },
-  fn: (p) => W`${p.command}`
-}, ae = {
+  fn: (p) => F`${p.command}`
+}, de = {
   name: "get_datetime",
   description: "Get current UTC date / time",
   args: {},
   fn: async () => (/* @__PURE__ */ new Date()).toUTCString()
-}, ce = {
+}, ue = {
   name: "exec",
   description: "Run code/scripts",
   args: {
@@ -573,17 +586,17 @@ const G = {
     try {
       switch (p.type) {
         case "bash":
-          return await G.fn({ command: p.code }, r, e);
+          return await K.fn({ command: p.code }, r, e);
         case "node":
-          return await B.fn({ code: p.code }, r, e);
+          return await V.fn({ code: p.code }, r, e);
         case "python":
-          return await Q.fn({ code: p.code }, r, e);
+          return await X.fn({ code: p.code }, r, e);
       }
     } catch (t) {
       return { error: t?.message || t.toString() };
     }
   }
-}, le = {
+}, pe = {
   name: "fetch",
   description: "Make HTTP request to URL",
   args: {
@@ -592,25 +605,25 @@ const G = {
     headers: { type: "object", description: "HTTP headers to send", default: {} },
     body: { type: "object", description: "HTTP body to send" }
   },
-  fn: (p) => new P({ url: p.url, headers: p.headers }).request({ method: p.method || "GET", body: p.body })
-}, B = {
+  fn: (p) => new $({ url: p.url, headers: p.headers }).request({ method: p.method || "GET", body: p.body })
+}, V = {
   name: "exec_javascript",
   description: "Execute commonjs javascript",
   args: {
     code: { type: "string", description: "CommonJS javascript", required: !0 }
   },
   fn: async (p) => {
-    const r = q(null), e = await $({ console: r }, p.code, !0).catch((t) => r.output.error.push(t));
+    const r = M(null), e = await E({ console: r }, p.code, !0).catch((t) => r.output.error.push(t));
     return { ...r.output, return: e, stdout: void 0, stderr: void 0 };
   }
-}, Q = {
+}, X = {
   name: "exec_javascript",
   description: "Execute commonjs javascript",
   args: {
     code: { type: "string", description: "CommonJS javascript", required: !0 }
   },
-  fn: async (p) => ({ result: D`python -c "${p.code}"` })
-}, me = {
+  fn: async (p) => ({ result: H`python -c "${p.code}"` })
+}, he = {
   name: "read_webpage",
   description: "Extract clean, structured content from a webpage. Use after web_search to read specific URLs",
   args: {
@@ -618,18 +631,18 @@ const G = {
     focus: { type: "string", description: 'Optional: What aspect to focus on (e.g., "pricing", "features", "contact info")' }
   },
   fn: async (p) => {
-    const r = await fetch(p.url, { headers: { "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)" } }).then((s) => s.text()).catch((s) => {
-      throw new Error(`Failed to fetch: ${s.message}`);
-    }), e = C.load(r);
+    const r = await fetch(p.url, { headers: { "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)" } }).then((n) => n.text()).catch((n) => {
+      throw new Error(`Failed to fetch: ${n.message}`);
+    }), e = I.load(r);
     e('script, style, nav, footer, header, aside, iframe, noscript, [role="navigation"], [role="banner"], .ad, .ads, .cookie, .popup').remove();
     const t = {
       title: e('meta[property="og:title"]').attr("content") || e("title").text() || "",
       description: e('meta[name="description"]').attr("content") || e('meta[property="og:description"]').attr("content") || ""
     };
     let i = "";
-    const n = ["article", "main", '[role="main"]', ".content", ".post", ".entry", "body"];
-    for (const s of n) {
-      const o = e(s).first();
+    const s = ["article", "main", '[role="main"]', ".content", ".post", ".entry", "body"];
+    for (const n of s) {
+      const o = e(n).first();
       if (o.length && o.text().trim().length > 200) {
         i = o.text();
         break;
@@ -637,7 +650,7 @@ const G = {
     }
     return i || (i = e("body").text()), i = i.replace(/\s+/g, " ").trim().slice(0, 8e3), { url: p.url, title: t.title.trim(), description: t.description.trim(), content: i, focus: p.focus };
   }
-}, de = {
+}, fe = {
   name: "web_search",
   description: "Use duckduckgo (anonymous) to find find relevant online resources. Returns a list of URLs that works great with the `read_webpage` tool",
   args: {
@@ -647,30 +660,30 @@ const G = {
   fn: async (p) => {
     const r = await fetch(`https://html.duckduckgo.com/html/?q=${encodeURIComponent(p.query)}`, {
       headers: { "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)", "Accept-Language": "en-US,en;q=0.9" }
-    }).then((n) => n.text());
+    }).then((s) => s.text());
     let e, t = /<a .*?href="(.+?)".+?<\/a>/g;
-    const i = new M();
+    const i = new A();
     for (; (e = t.exec(r)) !== null; ) {
-      let n = /uddg=(.+)&amp?/.exec(decodeURIComponent(e[1]))?.[1];
-      if (n && (n = decodeURIComponent(n)), n && i.add(n), i.size >= (p.length || 5)) break;
+      let s = /uddg=(.+)&amp?/.exec(decodeURIComponent(e[1]))?.[1];
+      if (s && (s = decodeURIComponent(s)), s && i.add(s), i.size >= (p.length || 5)) break;
     }
     return i;
   }
 };
 export {
-  ie as Ai,
-  I as Anthropic,
-  J as Audio,
-  G as CliTool,
-  ae as DateTimeTool,
-  ce as ExecTool,
-  le as FetchTool,
-  B as JSTool,
-  S as LLMProvider,
+  me as Ai,
+  J as Anthropic,
+  G as Audio,
+  K as CliTool,
+  de as DateTimeTool,
+  ue as ExecTool,
+  pe as FetchTool,
+  V as JSTool,
+  j as LLMProvider,
   _ as OpenAi,
-  Q as PythonTool,
-  me as ReadWebpageTool,
-  F as Vision,
-  de as WebSearchTool
+  X as PythonTool,
+  he as ReadWebpageTool,
+  Q as Vision,
+  fe as WebSearchTool
 };
 //# sourceMappingURL=index.mjs.map