npm - @livekit/agents - Versions diffs - 0.4.6 → 0.5.0 - Mend

@livekit/agents 0.4.6 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (197) hide show

package/README.md +17 -0
package/dist/audio.cjs +77 -0
package/dist/audio.cjs.map +1 -0
package/dist/audio.js +48 -37
package/dist/audio.js.map +1 -1
package/dist/cli.cjs +131 -0
package/dist/cli.cjs.map +1 -0
package/dist/cli.js +96 -122
package/dist/cli.js.map +1 -1
package/dist/generator.cjs +36 -0
package/dist/generator.cjs.map +1 -0
package/dist/generator.js +8 -22
package/dist/generator.js.map +1 -1
package/dist/http_server.cjs +72 -0
package/dist/http_server.cjs.map +1 -0
package/dist/http_server.d.ts +1 -1
package/dist/http_server.js +44 -47
package/dist/http_server.js.map +1 -1
package/dist/index.cjs +78 -0
package/dist/index.cjs.map +1 -0
package/dist/index.js +26 -28
package/dist/index.js.map +1 -1
package/dist/ipc/job_executor.cjs +33 -0
package/dist/ipc/job_executor.cjs.map +1 -0
package/dist/ipc/job_executor.js +7 -4
package/dist/ipc/job_executor.js.map +1 -1
package/dist/ipc/job_main.cjs +147 -0
package/dist/ipc/job_main.cjs.map +1 -0
package/dist/ipc/job_main.d.ts +1 -1
package/dist/ipc/job_main.js +103 -103
package/dist/ipc/job_main.js.map +1 -1
package/dist/ipc/message.cjs +17 -0
package/dist/ipc/message.cjs.map +1 -0
package/dist/ipc/message.js +0 -1
package/dist/ipc/message.js.map +1 -1
package/dist/ipc/proc_job_executor.cjs +174 -0
package/dist/ipc/proc_job_executor.cjs.map +1 -0
package/dist/ipc/proc_job_executor.js +130 -126
package/dist/ipc/proc_job_executor.js.map +1 -1
package/dist/ipc/proc_pool.cjs +126 -0
package/dist/ipc/proc_pool.cjs.map +1 -0
package/dist/ipc/proc_pool.js +93 -96
package/dist/ipc/proc_pool.js.map +1 -1
package/dist/job.cjs +230 -0
package/dist/job.cjs.map +1 -0
package/dist/job.js +195 -198
package/dist/job.js.map +1 -1
package/dist/llm/chat_context.cjs +131 -0
package/dist/llm/chat_context.cjs.map +1 -0
package/dist/llm/chat_context.js +98 -86
package/dist/llm/chat_context.js.map +1 -1
package/dist/llm/function_context.cjs +103 -0
package/dist/llm/function_context.cjs.map +1 -0
package/dist/llm/function_context.js +72 -81
package/dist/llm/function_context.js.map +1 -1
package/dist/llm/function_context.test.cjs +218 -0
package/dist/llm/function_context.test.cjs.map +1 -0
package/dist/llm/function_context.test.js +209 -210
package/dist/llm/function_context.test.js.map +1 -1
package/dist/llm/index.cjs +43 -0
package/dist/llm/index.cjs.map +1 -0
package/dist/llm/index.js +22 -6
package/dist/llm/index.js.map +1 -1
package/dist/llm/llm.cjs +76 -0
package/dist/llm/llm.cjs.map +1 -0
package/dist/llm/llm.js +48 -42
package/dist/llm/llm.js.map +1 -1
package/dist/log.cjs +57 -0
package/dist/log.cjs.map +1 -0
package/dist/log.js +27 -26
package/dist/log.js.map +1 -1
package/dist/multimodal/agent_playout.cjs +228 -0
package/dist/multimodal/agent_playout.cjs.map +1 -0
package/dist/multimodal/agent_playout.d.ts +1 -1
package/dist/multimodal/agent_playout.js +193 -180
package/dist/multimodal/agent_playout.js.map +1 -1
package/dist/multimodal/index.cjs +25 -0
package/dist/multimodal/index.cjs.map +1 -0
package/dist/multimodal/index.js +2 -5
package/dist/multimodal/index.js.map +1 -1
package/dist/multimodal/multimodal_agent.cjs +404 -0
package/dist/multimodal/multimodal_agent.cjs.map +1 -0
package/dist/multimodal/multimodal_agent.d.ts +1 -1
package/dist/multimodal/multimodal_agent.js +351 -330
package/dist/multimodal/multimodal_agent.js.map +1 -1
package/dist/pipeline/agent_output.cjs +172 -0
package/dist/pipeline/agent_output.cjs.map +1 -0
package/dist/pipeline/agent_output.js +136 -138
package/dist/pipeline/agent_output.js.map +1 -1
package/dist/pipeline/agent_playout.cjs +169 -0
package/dist/pipeline/agent_playout.cjs.map +1 -0
package/dist/pipeline/agent_playout.js +126 -136
package/dist/pipeline/agent_playout.js.map +1 -1
package/dist/pipeline/human_input.cjs +158 -0
package/dist/pipeline/human_input.cjs.map +1 -0
package/dist/pipeline/human_input.js +124 -125
package/dist/pipeline/human_input.js.map +1 -1
package/dist/pipeline/index.cjs +31 -0
package/dist/pipeline/index.cjs.map +1 -0
package/dist/pipeline/index.js +8 -4
package/dist/pipeline/index.js.map +1 -1
package/dist/pipeline/pipeline_agent.cjs +642 -0
package/dist/pipeline/pipeline_agent.cjs.map +1 -0
package/dist/pipeline/pipeline_agent.js +595 -651
package/dist/pipeline/pipeline_agent.js.map +1 -1
package/dist/pipeline/speech_handle.cjs +128 -0
package/dist/pipeline/speech_handle.cjs.map +1 -0
package/dist/pipeline/speech_handle.js +102 -100
package/dist/pipeline/speech_handle.js.map +1 -1
package/dist/plugin.cjs +46 -0
package/dist/plugin.cjs.map +1 -0
package/dist/plugin.js +20 -20
package/dist/plugin.js.map +1 -1
package/dist/stt/index.cjs +38 -0
package/dist/stt/index.cjs.map +1 -0
package/dist/stt/index.js +13 -5
package/dist/stt/index.js.map +1 -1
package/dist/stt/stream_adapter.cjs +87 -0
package/dist/stt/stream_adapter.cjs.map +1 -0
package/dist/stt/stream_adapter.js +58 -55
package/dist/stt/stream_adapter.js.map +1 -1
package/dist/stt/stt.cjs +98 -0
package/dist/stt/stt.cjs.map +1 -0
package/dist/stt/stt.js +63 -98
package/dist/stt/stt.js.map +1 -1
package/dist/tokenize/basic/basic.cjs +98 -0
package/dist/tokenize/basic/basic.cjs.map +1 -0
package/dist/tokenize/basic/basic.js +56 -45
package/dist/tokenize/basic/basic.js.map +1 -1
package/dist/tokenize/basic/hyphenator.cjs +425 -0
package/dist/tokenize/basic/hyphenator.cjs.map +1 -0
package/dist/tokenize/basic/hyphenator.js +66 -82
package/dist/tokenize/basic/hyphenator.js.map +1 -1
package/dist/tokenize/basic/index.cjs +35 -0
package/dist/tokenize/basic/index.cjs.map +1 -0
package/dist/tokenize/basic/index.js +7 -4
package/dist/tokenize/basic/index.js.map +1 -1
package/dist/tokenize/basic/paragraph.cjs +57 -0
package/dist/tokenize/basic/paragraph.cjs.map +1 -0
package/dist/tokenize/basic/paragraph.js +30 -35
package/dist/tokenize/basic/paragraph.js.map +1 -1
package/dist/tokenize/basic/sentence.cjs +83 -0
package/dist/tokenize/basic/sentence.cjs.map +1 -0
package/dist/tokenize/basic/sentence.js +56 -57
package/dist/tokenize/basic/sentence.js.map +1 -1
package/dist/tokenize/basic/word.cjs +44 -0
package/dist/tokenize/basic/word.cjs.map +1 -0
package/dist/tokenize/basic/word.js +17 -20
package/dist/tokenize/basic/word.js.map +1 -1
package/dist/tokenize/index.cjs +55 -0
package/dist/tokenize/index.cjs.map +1 -0
package/dist/tokenize/index.js +18 -7
package/dist/tokenize/index.js.map +1 -1
package/dist/tokenize/token_stream.cjs +164 -0
package/dist/tokenize/token_stream.cjs.map +1 -0
package/dist/tokenize/token_stream.js +133 -139
package/dist/tokenize/token_stream.js.map +1 -1
package/dist/tokenize/tokenizer.cjs +184 -0
package/dist/tokenize/tokenizer.cjs.map +1 -0
package/dist/tokenize/tokenizer.js +138 -99
package/dist/tokenize/tokenizer.js.map +1 -1
package/dist/transcription.cjs +131 -0
package/dist/transcription.cjs.map +1 -0
package/dist/transcription.js +99 -96
package/dist/transcription.js.map +1 -1
package/dist/tts/index.cjs +38 -0
package/dist/tts/index.cjs.map +1 -0
package/dist/tts/index.js +13 -5
package/dist/tts/index.js.map +1 -1
package/dist/tts/stream_adapter.cjs +78 -0
package/dist/tts/stream_adapter.cjs.map +1 -0
package/dist/tts/stream_adapter.js +50 -47
package/dist/tts/stream_adapter.js.map +1 -1
package/dist/tts/tts.cjs +127 -0
package/dist/tts/tts.cjs.map +1 -0
package/dist/tts/tts.js +90 -120
package/dist/tts/tts.js.map +1 -1
package/dist/utils.cjs +284 -0
package/dist/utils.cjs.map +1 -0
package/dist/utils.js +242 -247
package/dist/utils.js.map +1 -1
package/dist/vad.cjs +92 -0
package/dist/vad.cjs.map +1 -0
package/dist/vad.js +57 -52
package/dist/vad.js.map +1 -1
package/dist/version.cjs +29 -0
package/dist/version.cjs.map +1 -0
package/dist/version.js +4 -4
package/dist/version.js.map +1 -1
package/dist/worker.cjs +576 -0
package/dist/worker.cjs.map +1 -0
package/dist/worker.d.ts +1 -1
package/dist/worker.js +511 -484
package/dist/worker.js.map +1 -1
package/package.json +18 -8
package/src/ipc/job_main.ts +66 -64
package/src/pipeline/pipeline_agent.ts +23 -23

package/dist/tokenize/basic/basic.cjs ADDED Viewed

@@ -0,0 +1,98 @@
+"use strict";
+var __create = Object.create;
+var __defProp = Object.defineProperty;
+var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
+var __getOwnPropNames = Object.getOwnPropertyNames;
+var __getProtoOf = Object.getPrototypeOf;
+var __hasOwnProp = Object.prototype.hasOwnProperty;
+var __export = (target, all) => {
+  for (var name in all)
+    __defProp(target, name, { get: all[name], enumerable: true });
+};
+var __copyProps = (to, from, except, desc) => {
+  if (from && typeof from === "object" || typeof from === "function") {
+    for (let key of __getOwnPropNames(from))
+      if (!__hasOwnProp.call(to, key) && key !== except)
+        __defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
+  }
+  return to;
+};
+var __toESM = (mod, isNodeMode, target) => (target = mod != null ? __create(__getProtoOf(mod)) : {}, __copyProps(
+  // If the importer is in node compatibility mode or this is not an ESM
+  // file that has been converted to a CommonJS file using a Babel-
+  // compatible transform (i.e. "__esModule" has not been set), then set
+  // "default" to the CommonJS "module.exports" for node compatibility.
+  isNodeMode || !mod || !mod.__esModule ? __defProp(target, "default", { value: mod, enumerable: true }) : target,
+  mod
+));
+var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
+var basic_exports = {};
+__export(basic_exports, {
+  SentenceTokenizer: () => SentenceTokenizer,
+  WordTokenizer: () => WordTokenizer,
+  hyphenateWord: () => hyphenateWord,
+  tokenizeParagraphs: () => tokenizeParagraphs
+});
+module.exports = __toCommonJS(basic_exports);
+var tokenizer = __toESM(require("../index.cjs"), 1);
+var import_token_stream = require("../token_stream.cjs");
+var import_hyphenator = require("./hyphenator.cjs");
+var import_paragraph = require("./paragraph.cjs");
+var import_sentence = require("./sentence.cjs");
+var import_word = require("./word.cjs");
+class SentenceTokenizer extends tokenizer.SentenceTokenizer {
+  #config;
+  constructor(language = "en-US", minSentenceLength = 20, streamContextLength = 10) {
+    super();
+    this.#config = {
+      language,
+      minSentenceLength,
+      streamContextLength
+    };
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  tokenize(text, language) {
+    return (0, import_sentence.splitSentences)(text, this.#config.minSentenceLength).map((tok) => tok[0]);
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  stream(language) {
+    return new import_token_stream.BufferedSentenceStream(
+      (text) => (0, import_sentence.splitSentences)(text, this.#config.minSentenceLength),
+      this.#config.minSentenceLength,
+      this.#config.streamContextLength
+    );
+  }
+}
+class WordTokenizer extends tokenizer.WordTokenizer {
+  #ignorePunctuation;
+  constructor(ignorePunctuation = true) {
+    super();
+    this.#ignorePunctuation = ignorePunctuation;
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  tokenize(text, language) {
+    return (0, import_word.splitWords)(text, this.#ignorePunctuation).map((tok) => tok[0]);
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  stream(language) {
+    return new import_token_stream.BufferedWordStream(
+      (text) => (0, import_word.splitWords)(text, this.#ignorePunctuation),
+      1,
+      1
+    );
+  }
+}
+const hyphenateWord = (word) => {
+  return import_hyphenator.hyphenator.hyphenateWord(word);
+};
+const tokenizeParagraphs = (text) => {
+  return (0, import_paragraph.splitParagraphs)(text).map((tok) => tok[0]);
+};
+// Annotate the CommonJS export names for ESM import in node:
+0 && (module.exports = {
+  SentenceTokenizer,
+  WordTokenizer,
+  hyphenateWord,
+  tokenizeParagraphs
+});
+//# sourceMappingURL=basic.cjs.map

package/dist/tokenize/basic/basic.cjs.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"sources":["../../../src/tokenize/basic/basic.ts"],"sourcesContent":["// SPDX-FileCopyrightText: 2024 LiveKit, Inc.\n//\n// SPDX-License-Identifier: Apache-2.0\nimport * as tokenizer from '../index.js';\nimport { BufferedSentenceStream, BufferedWordStream } from '../token_stream.js';\nimport { hyphenator } from './hyphenator.js';\nimport { splitParagraphs } from './paragraph.js';\nimport { splitSentences } from './sentence.js';\nimport { splitWords } from './word.js';\n\ninterface TokenizerOptions {\n language: string;\n minSentenceLength: number;\n streamContextLength: number;\n}\n\nexport class SentenceTokenizer extends tokenizer.SentenceTokenizer {\n #config: TokenizerOptions;\n\n constructor(language = 'en-US', minSentenceLength = 20, streamContextLength = 10) {\n super();\n this.#config = {\n language,\n minSentenceLength,\n streamContextLength,\n };\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n tokenize(text: string, language?: string): string[] {\n return splitSentences(text, this.#config.minSentenceLength).map((tok) => tok[0]);\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n stream(language?: string): tokenizer.SentenceStream {\n return new BufferedSentenceStream(\n (text: string) => splitSentences(text, this.#config.minSentenceLength),\n this.#config.minSentenceLength,\n this.#config.streamContextLength,\n );\n }\n}\n\nexport class WordTokenizer extends tokenizer.WordTokenizer {\n #ignorePunctuation: boolean;\n\n constructor(ignorePunctuation = true) {\n super();\n this.#ignorePunctuation = ignorePunctuation;\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n tokenize(text: string, language?: string): string[] {\n return splitWords(text, this.#ignorePunctuation).map((tok) => tok[0]);\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n stream(language?: string): tokenizer.WordStream {\n return new BufferedWordStream(\n (text: string) => splitWords(text, this.#ignorePunctuation),\n 1,\n 1,\n );\n }\n}\n\nexport const hyphenateWord = (word: string): string[] => {\n return hyphenator.hyphenateWord(word);\n};\n\nexport const tokenizeParagraphs = (text: string): string[] => {\n return splitParagraphs(text).map((tok) => tok[0]);\n};\n"],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAGA,gBAA2B;AAC3B,0BAA2D;AAC3D,wBAA2B;AAC3B,uBAAgC;AAChC,sBAA+B;AAC/B,kBAA2B;AAQpB,MAAM,0BAA0B,UAAU,kBAAkB;AAAA,EACjE;AAAA,EAEA,YAAY,WAAW,SAAS,oBAAoB,IAAI,sBAAsB,IAAI;AAChF,UAAM;AACN,SAAK,UAAU;AAAA,MACb;AAAA,MACA;AAAA,MACA;AAAA,IACF;AAAA,EACF;AAAA;AAAA,EAGA,SAAS,MAAc,UAA6B;AAClD,eAAO,gCAAe,MAAM,KAAK,QAAQ,iBAAiB,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAAA,EACjF;AAAA;AAAA,EAGA,OAAO,UAA6C;AAClD,WAAO,IAAI;AAAA,MACT,CAAC,aAAiB,gCAAe,MAAM,KAAK,QAAQ,iBAAiB;AAAA,MACrE,KAAK,QAAQ;AAAA,MACb,KAAK,QAAQ;AAAA,IACf;AAAA,EACF;AACF;AAEO,MAAM,sBAAsB,UAAU,cAAc;AAAA,EACzD;AAAA,EAEA,YAAY,oBAAoB,MAAM;AACpC,UAAM;AACN,SAAK,qBAAqB;AAAA,EAC5B;AAAA;AAAA,EAGA,SAAS,MAAc,UAA6B;AAClD,eAAO,wBAAW,MAAM,KAAK,kBAAkB,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAAA,EACtE;AAAA;AAAA,EAGA,OAAO,UAAyC;AAC9C,WAAO,IAAI;AAAA,MACT,CAAC,aAAiB,wBAAW,MAAM,KAAK,kBAAkB;AAAA,MAC1D;AAAA,MACA;AAAA,IACF;AAAA,EACF;AACF;AAEO,MAAM,gBAAgB,CAAC,SAA2B;AACvD,SAAO,6BAAW,cAAc,IAAI;AACtC;AAEO,MAAM,qBAAqB,CAAC,SAA2B;AAC5D,aAAO,kCAAgB,IAAI,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAClD;","names":[]}

package/dist/tokenize/basic/basic.js CHANGED Viewed

@@ -1,50 +1,61 @@
-// SPDX-FileCopyrightText: 2024 LiveKit, Inc.
-//
-// SPDX-License-Identifier: Apache-2.0
-import * as tokenizer from '../index.js';
-import { BufferedSentenceStream, BufferedWordStream } from '../token_stream.js';
-import { hyphenator } from './hyphenator.js';
-import { splitParagraphs } from './paragraph.js';
-import { splitSentences } from './sentence.js';
-import { splitWords } from './word.js';
-export class SentenceTokenizer extends tokenizer.SentenceTokenizer {
-    #config;
-    constructor(language = 'en-US', minSentenceLength = 20, streamContextLength = 10) {
-        super();
-        this.#config = {
-            language,
-            minSentenceLength,
-            streamContextLength,
-        };
-    }
-    // eslint-disable-next-line @typescript-eslint/no-unused-vars
-    tokenize(text, language) {
-        return splitSentences(text, this.#config.minSentenceLength).map((tok) => tok[0]);
-    }
-    // eslint-disable-next-line @typescript-eslint/no-unused-vars
-    stream(language) {
-        return new BufferedSentenceStream((text) => splitSentences(text, this.#config.minSentenceLength), this.#config.minSentenceLength, this.#config.streamContextLength);
-    }
+import * as tokenizer from "../index.js";
+import { BufferedSentenceStream, BufferedWordStream } from "../token_stream.js";
+import { hyphenator } from "./hyphenator.js";
+import { splitParagraphs } from "./paragraph.js";
+import { splitSentences } from "./sentence.js";
+import { splitWords } from "./word.js";
+class SentenceTokenizer extends tokenizer.SentenceTokenizer {
+  #config;
+  constructor(language = "en-US", minSentenceLength = 20, streamContextLength = 10) {
+    super();
+    this.#config = {
+      language,
+      minSentenceLength,
+      streamContextLength
+    };
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  tokenize(text, language) {
+    return splitSentences(text, this.#config.minSentenceLength).map((tok) => tok[0]);
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  stream(language) {
+    return new BufferedSentenceStream(
+      (text) => splitSentences(text, this.#config.minSentenceLength),
+      this.#config.minSentenceLength,
+      this.#config.streamContextLength
+    );
+  }
 }
-export class WordTokenizer extends tokenizer.WordTokenizer {
-    #ignorePunctuation;
-    constructor(ignorePunctuation = true) {
-        super();
-        this.#ignorePunctuation = ignorePunctuation;
-    }
-    // eslint-disable-next-line @typescript-eslint/no-unused-vars
-    tokenize(text, language) {
-        return splitWords(text, this.#ignorePunctuation).map((tok) => tok[0]);
-    }
-    // eslint-disable-next-line @typescript-eslint/no-unused-vars
-    stream(language) {
-        return new BufferedWordStream((text) => splitWords(text, this.#ignorePunctuation), 1, 1);
-    }
+class WordTokenizer extends tokenizer.WordTokenizer {
+  #ignorePunctuation;
+  constructor(ignorePunctuation = true) {
+    super();
+    this.#ignorePunctuation = ignorePunctuation;
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  tokenize(text, language) {
+    return splitWords(text, this.#ignorePunctuation).map((tok) => tok[0]);
+  }
+  // eslint-disable-next-line @typescript-eslint/no-unused-vars
+  stream(language) {
+    return new BufferedWordStream(
+      (text) => splitWords(text, this.#ignorePunctuation),
+      1,
+      1
+    );
+  }
 }
-export const hyphenateWord = (word) => {
-    return hyphenator.hyphenateWord(word);
+const hyphenateWord = (word) => {
+  return hyphenator.hyphenateWord(word);
 };
-export const tokenizeParagraphs = (text) => {
-    return splitParagraphs(text).map((tok) => tok[0]);
+const tokenizeParagraphs = (text) => {
+  return splitParagraphs(text).map((tok) => tok[0]);
+};
+export {
+  SentenceTokenizer,
+  WordTokenizer,
+  hyphenateWord,
+  tokenizeParagraphs
 };
 //# sourceMappingURL=basic.js.map

package/dist/tokenize/basic/basic.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"~~file":"basic.js","sourceRoot":"","~~sources":["../../../src/tokenize/basic/basic.ts"],"~~names~~":[],"~~mappings"~~:~~"AAAA~~,~~6CAA6C;AAC7C~~,~~EAAE;AACF~~,~~sCAAsC;AACtC~~,~~OAAO~~,~~KAAK~~,~~SAAS~~,~~MAAM~~,~~aAAa~~,~~CAAC;AACzC~~,~~OAAO~~,~~EAAE~~,~~sBAAsB~~,~~EAAE~~,~~kBAAkB~~,~~EAAE~~,~~MAAM,oBAAoB,CAAC~~;~~AAChF~~,~~OAAO~~,~~EAAE,UAAU,EAAE,MAAM,iBAAiB,CAAC~~;~~AAC7C~~,~~OAAO~~,~~EAAE,eAAe,EAAE,MAAM,gBAAgB,CAAC~~;~~AACjD~~,~~OAAO~~,~~EAAE,cAAc,EAAE,MAAM,eAAe,CAAC~~;AAC/C,~~OAAO~~,~~EAAE,UAAU,EAAE,MAAM,WAAW,CAAC~~;~~AAQvC~~,MAAM,~~OAAO~~,~~iBAAkB~~,~~SAAQ~~,~~SAAS,CAAC,iBAAiB~~;~~IAChE~~,~~OAAO~~,~~CAAmB;IAE1B,~~YAAY,~~QAAQ~~,~~GAAG~~,~~OAAO~~,~~EAAE~~,~~iBAAiB~~,~~GAAG,EAAE,EAAE,mBAAmB,GAAG,EAAE~~;~~QAC9E~~,~~KAAK,EAAE,CAAC~~;~~QACR~~,~~IAAI~~,~~CAAC,OAAO,GAAG~~;~~YACb~~,~~QAAQ~~;~~YACR~~,~~iBAAiB~~;~~YACjB~~,~~mBAAmB~~;~~SACpB~~,~~CAAC~~;~~IACJ~~,~~CAAC~~;~~IAED,6DAA6D~~;~~IAC7D~~,~~QAAQ~~,~~CAAC~~,~~IAAY~~,~~EAAE,QAAiB~~;~~QACtC~~,~~OAAO~~,~~cAAc~~,~~CAAC~~,~~IAAI~~,~~EAAE~~,~~IAAI,CAAC,OAAO,CAAC,~~iBAAiB,~~CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,~~EAAE,~~EAAE~~,CAAC,~~GAAG~~,~~CAAC~~,CAAC,CAAC~~,CAAC,CAAC~~;~~IACnF~~,~~CAAC~~;~~IAED,6DAA6D~~;~~IAC7D~~,~~MAAM~~,~~CAAC~~,~~QAAiB~~;~~QACtB~~,~~OAAO~~,IAAI,~~sBAAsB~~,~~CAC/B,~~CAAC,~~IAAY~~,~~EAAE~~,~~EAAE~~,~~CAAC~~,~~cAAc~~,~~CAAC,IAAI,EAAE,IAAI,CAAC,OAAO,CAAC,~~iBAAiB,~~CAAC~~,~~EACtE~~,~~IAAI~~,~~CAAC~~,~~OAAO~~,~~CAAC~~,~~iBAAiB,EAC9B,IAAI,CAAC,OAAO,CAAC,mBAAmB,CACjC,CAAC~~;~~IACJ~~,~~CAAC~~;~~CACF~~;~~AAED~~,MAAM,~~OAAO~~,~~aAAc~~,~~SAAQ~~,~~SAAS,CAAC,aAAa~~;~~IACxD~~,~~kBAAkB~~,~~CAAU;IAE5B,~~YAAY,~~iBAAiB~~,~~GAAG,IAAI~~;~~QAClC~~,~~KAAK,EAAE,CAAC~~;~~QACR~~,~~IAAI~~,~~CAAC,kBAAkB,GAAG,iBAAiB,CAAC~~;~~IAC9C~~,~~CAAC~~;~~IAED,6DAA6D~~;~~IAC7D~~,~~QAAQ~~,~~CAAC~~,~~IAAY~~,~~EAAE,QAAiB~~;~~QACtC~~,~~OAAO~~,~~UAAU~~,~~CAAC~~,~~IAAI~~,~~EAAE,IAAI,CAAC,~~kBAAkB,~~CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,~~EAAE,~~EAAE~~,CAAC,~~GAAG~~,~~CAAC~~,CAAC,CAAC~~,CAAC,CAAC~~;~~IACxE~~,~~CAAC~~;~~IAED,6DAA6D~~;~~IAC7D~~,~~MAAM~~,~~CAAC~~,~~QAAiB~~;~~QACtB~~,~~OAAO~~,IAAI,~~kBAAkB~~,~~CAC3B,~~CAAC,~~IAAY~~,~~EAAE~~,~~EAAE~~,~~CAAC~~,~~UAAU,CAAC,IAAI,EAAE,IAAI,CAAC,~~kBAAkB,~~CAAC~~,~~EAC3D~~,~~CAAC,EACD,CAAC,CACF,CAAC~~;~~IACJ~~,~~CAAC~~;~~CACF~~;~~AAED~~,MAAM,~~CAAC~~,~~MAAM,aAAa,GAAG,~~CAAC,~~IAAY,EAAY,EAAE~~;~~IACtD~~,~~OAAO~~,~~UAAU~~,~~CAAC~~,~~aAAa,CAAC,~~IAAI~~,CAAC,CAAC~~;~~AACxC,CAAC,CAAC~~;~~AAEF~~,MAAM,~~CAAC~~,~~MAAM,kBAAkB,GAAG,~~CAAC,~~IAAY,EAAY,EAAE~~;~~IAC3D~~,~~OAAO~~,~~eAAe~~,~~CAAC,~~IAAI,~~CAAC,CAAC,GAAG,CAAC,CAAC,GAAG,~~EAAE,~~EAAE~~,CAAC,~~GAAG~~,~~CAAC~~,CAAC,CAAC~~,CAAC,CAAC~~;~~AACpD~~,~~CAAC,CAAC~~"}
1	+ {"version":3,"sources":["../../../src/tokenize/basic/basic.ts"],"sourcesContent":["// SPDX-FileCopyrightText: 2024 LiveKit, Inc.\n//\n// SPDX-License-Identifier: Apache-2.0\nimport * as tokenizer from '../index.js';\nimport { BufferedSentenceStream, BufferedWordStream } from '../token_stream.js';\nimport { hyphenator } from './hyphenator.js';\nimport { splitParagraphs } from './paragraph.js';\nimport { splitSentences } from './sentence.js';\nimport { splitWords } from './word.js';\n\ninterface TokenizerOptions {\n language: string;\n minSentenceLength: number;\n streamContextLength: number;\n}\n\nexport class SentenceTokenizer extends tokenizer.SentenceTokenizer {\n #config: TokenizerOptions;\n\n constructor(language = 'en-US', minSentenceLength = 20, streamContextLength = 10) {\n super();\n this.#config = {\n language,\n minSentenceLength,\n streamContextLength,\n };\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n tokenize(text: string, language?: string): string[] {\n return splitSentences(text, this.#config.minSentenceLength).map((tok) => tok[0]);\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n stream(language?: string): tokenizer.SentenceStream {\n return new BufferedSentenceStream(\n (text: string) => splitSentences(text, this.#config.minSentenceLength),\n this.#config.minSentenceLength,\n this.#config.streamContextLength,\n );\n }\n}\n\nexport class WordTokenizer extends tokenizer.WordTokenizer {\n #ignorePunctuation: boolean;\n\n constructor(ignorePunctuation = true) {\n super();\n this.#ignorePunctuation = ignorePunctuation;\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n tokenize(text: string, language?: string): string[] {\n return splitWords(text, this.#ignorePunctuation).map((tok) => tok[0]);\n }\n\n // eslint-disable-next-line @typescript-eslint/no-unused-vars\n stream(language?: string): tokenizer.WordStream {\n return new BufferedWordStream(\n (text: string) => splitWords(text, this.#ignorePunctuation),\n 1,\n 1,\n );\n }\n}\n\nexport const hyphenateWord = (word: string): string[] => {\n return hyphenator.hyphenateWord(word);\n};\n\nexport const tokenizeParagraphs = (text: string): string[] => {\n return splitParagraphs(text).map((tok) => tok[0]);\n};\n"],"mappings":"AAGA,YAAY,eAAe;AAC3B,SAAS,wBAAwB,0BAA0B;AAC3D,SAAS,kBAAkB;AAC3B,SAAS,uBAAuB;AAChC,SAAS,sBAAsB;AAC/B,SAAS,kBAAkB;AAQpB,MAAM,0BAA0B,UAAU,kBAAkB;AAAA,EACjE;AAAA,EAEA,YAAY,WAAW,SAAS,oBAAoB,IAAI,sBAAsB,IAAI;AAChF,UAAM;AACN,SAAK,UAAU;AAAA,MACb;AAAA,MACA;AAAA,MACA;AAAA,IACF;AAAA,EACF;AAAA;AAAA,EAGA,SAAS,MAAc,UAA6B;AAClD,WAAO,eAAe,MAAM,KAAK,QAAQ,iBAAiB,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAAA,EACjF;AAAA;AAAA,EAGA,OAAO,UAA6C;AAClD,WAAO,IAAI;AAAA,MACT,CAAC,SAAiB,eAAe,MAAM,KAAK,QAAQ,iBAAiB;AAAA,MACrE,KAAK,QAAQ;AAAA,MACb,KAAK,QAAQ;AAAA,IACf;AAAA,EACF;AACF;AAEO,MAAM,sBAAsB,UAAU,cAAc;AAAA,EACzD;AAAA,EAEA,YAAY,oBAAoB,MAAM;AACpC,UAAM;AACN,SAAK,qBAAqB;AAAA,EAC5B;AAAA;AAAA,EAGA,SAAS,MAAc,UAA6B;AAClD,WAAO,WAAW,MAAM,KAAK,kBAAkB,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAAA,EACtE;AAAA;AAAA,EAGA,OAAO,UAAyC;AAC9C,WAAO,IAAI;AAAA,MACT,CAAC,SAAiB,WAAW,MAAM,KAAK,kBAAkB;AAAA,MAC1D;AAAA,MACA;AAAA,IACF;AAAA,EACF;AACF;AAEO,MAAM,gBAAgB,CAAC,SAA2B;AACvD,SAAO,WAAW,cAAc,IAAI;AACtC;AAEO,MAAM,qBAAqB,CAAC,SAA2B;AAC5D,SAAO,gBAAgB,IAAI,EAAE,IAAI,CAAC,QAAQ,IAAI,CAAC,CAAC;AAClD;","names":[]}