npm - @mikugg/guidance - Versions diffs - 0.8.0 → 0.10.0 - Mend

@mikugg/guidance 0.8.0 → 0.10.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15)

package/dist/index.d.ts +3 -3
package/dist/index.d.ts.map +1 -1
package/dist/lib/__test__/template.test.js +20 -3
package/dist/lib/_llama-tokenizer.d.ts.map +1 -1
package/dist/lib/_llama-tokenizer.js +107 -94
package/dist/lib/_trie.js +1 -1
package/dist/lib/template.d.ts +3 -2
package/dist/lib/template.d.ts.map +1 -1
package/dist/lib/template.js +87 -21
package/dist/lib/token-generator.d.ts +6 -4
package/dist/lib/token-generator.d.ts.map +1 -1
package/dist/lib/token-generator.js +52 -14
package/dist/lib/tokenizer.d.ts.map +1 -1
package/dist/lib/tokenizer.js +6 -5
package/package.json +2 -2

package/dist/index.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
-import * as Tokenizer from './lib/tokenizer';
-import * as TokenGenerator from './lib/token-generator';
-import * as Template from './lib/template';
+import * as Tokenizer from "./lib/tokenizer";
+import * as TokenGenerator from "./lib/token-generator";
+import * as Template from "./lib/template";
 export { Tokenizer, TokenGenerator, Template };
 //# sourceMappingURL=index.d.ts.map

package/dist/index.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,OAAO,~~KAAM~~,SAAS,MAAM,iBAAiB,CAAC;~~AAC9C~~,OAAO,KAAK,cAAc,MAAM,uBAAuB,CAAC;AACxD,OAAO,KAAK,QAAQ,MAAM,gBAAgB,CAAC;AAE3C,OAAO,EAAE,SAAS,EAAE,cAAc,EAAE,QAAQ,EAAE,CAAC"}
1	+ {"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../src/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,SAAS,MAAM,iBAAiB,CAAC;AAC7C,OAAO,KAAK,cAAc,MAAM,uBAAuB,CAAC;AACxD,OAAO,KAAK,QAAQ,MAAM,gBAAgB,CAAC;AAE3C,OAAO,EAAE,SAAS,EAAE,cAAc,EAAE,QAAQ,EAAE,CAAC"}

package/dist/lib/__test__/template.test.js CHANGED Viewed

@@ -8,6 +8,18 @@ var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, ge
         step((generator = generator.apply(thisArg, _arguments || [])).next());
     });
 };
+var __await = (this && this.__await) || function (v) { return this instanceof __await ? (this.v = v, this) : new __await(v); }
+var __asyncGenerator = (this && this.__asyncGenerator) || function (thisArg, _arguments, generator) {
+    if (!Symbol.asyncIterator) throw new TypeError("Symbol.asyncIterator is not defined.");
+    var g = generator.apply(thisArg, _arguments || []), i, q = [];
+    return i = {}, verb("next"), verb("throw"), verb("return"), i[Symbol.asyncIterator] = function () { return this; }, i;
+    function verb(n) { if (g[n]) i[n] = function (v) { return new Promise(function (a, b) { q.push([n, v, a, b]) > 1 || resume(n, v); }); }; }
+    function resume(n, v) { try { step(g[n](v)); } catch (e) { settle(q[0][3], e); } }
+    function step(r) { r.value instanceof __await ? Promise.resolve(r.value.v).then(fulfill, reject) : settle(q[0][2], r); }
+    function fulfill(value) { resume("next", value); }
+    function reject(value) { resume("throw", value); }
+    function settle(f, v) { if (f(v), q.shift(), q.length) resume(q[0][0], q[0][1]); }
+};
 Object.defineProperty(exports, "__esModule", { value: true });
 const template_1 = require("../template");
 const tokenizer_1 = require("../tokenizer"); // import paths as required
@@ -21,8 +33,8 @@ class MockTokenGenerator extends token_generator_1.AbstractTokenGenerator {
     }
     // eslint-disable-next-line @typescript-eslint/no-unused-vars
     generateString(prompt, options) {
-        return __awaiter(this, void 0, void 0, function* () {
-            return 'generated';
+        return __asyncGenerator(this, arguments, function* generateString_1() {
+            return yield __await('generated');
         });
     }
 }
@@ -69,9 +81,14 @@ describe('TemplateProcessor', () => {
             expect(result.get('weather')).toEqual(' rainy');
         }));
         it('should process template with SEL method in a JSON correctly', () => __awaiter(void 0, void 0, void 0, function* () {
+            const mockGenerateString = function () {
+                return __asyncGenerator(this, arguments, function* () {
+                    yield yield __await('wizard');
+                });
+            };
             // 29879 = "s"
             const spyGenerateToken = jest.spyOn(generator, 'generateToken').mockReturnValue(new Promise((resolve) => resolve("s")));
-            const spyGenerateString = jest.spyOn(generator, 'generateString').mockReturnValue(new Promise((resolve) => resolve("wizard")));
+            const spyGenerateString = jest.spyOn(generator, 'generateString').mockImplementation(mockGenerateString);
             const result = yield templateProcessor.processTemplate(`RPG Game Character specification
         {
           "name": "{{name}}",

package/dist/lib/_llama-tokenizer.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"_llama-tokenizer.d.ts","sourceRoot":"","sources":["../../src/lib/_llama-tokenizer.ts"],"names":[],"mappings":"AAEA;;;;;;;;;;;GAWG;AAEH,MAAM,WAAW,cAAc;IAC7B,MAAM,EAAE,~~CACJ~~,IAAI,EAAE,MAAM,EACZ,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,EAC7B,eAAe,CAAC,EAAE,OAAO,~~KACxB~~,MAAM,EAAE,CAAC;IACd,MAAM,EAAE,~~CACJ~~,QAAQ,EAAE,MAAM,EAAE,EAClB,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,~~KAC5B~~,MAAM,~~CAAA~~;~~CACZ~~;AAED,QAAA,MAAM,cAAc,EAAE,cAAmB,~~CAAA~~;~~AA6czC~~,eAAe,cAAc,~~CAAA~~"}
1	+ {"version":3,"file":"_llama-tokenizer.d.ts","sourceRoot":"","sources":["../../src/lib/_llama-tokenizer.ts"],"names":[],"mappings":"AAEA;;;;;;;;;;;GAWG;AAEH,MAAM,WAAW,cAAc;IAC7B,MAAM,EAAE,CACN,IAAI,EAAE,MAAM,EACZ,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,EAC7B,eAAe,CAAC,EAAE,OAAO,KACtB,MAAM,EAAE,CAAC;IACd,MAAM,EAAE,CACN,QAAQ,EAAE,MAAM,EAAE,EAClB,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,KAC1B,MAAM,CAAC;CACb;AAED,QAAA,MAAM,cAAc,EAAE,cAAmB,CAAC;AAqgB1C,eAAe,cAAc,CAAC"}

package/dist/lib/_llama-tokenizer.js CHANGED Viewed

@@ -19,7 +19,9 @@ const base64decode = function (encodedString) {
     return atob(encodedString);
 };
 const getMergeIdentifierString = function (firstTokenId, secondTokenId) {
-    return llamaTokenizer.vocabById[firstTokenId] + " " + llamaTokenizer.vocabById[secondTokenId];
+    return (llamaTokenizer.vocabById[firstTokenId] +
+        " " +
+        llamaTokenizer.vocabById[secondTokenId]);
 };
 const decompressMerges = function (merges_binary) {
     // Base64 decode binary.
@@ -50,46 +52,46 @@ const decompressMerges = function (merges_binary) {
     return merges;
 };
 /**
-* Helper function to decode the vocabulary.
-*
-* vocab_base64 is base64-encoded string of tokens delimited by '\n' (line break) in utf-8.
-* The row number of the token (indexing from 0) represents the id of the token in LLaMA tokenizer.
-*
-* Most tokens look like this: "ic" (without the quotes) (representing the "i" character followed by the "c" character)
-* Some tokens are special. In particular, spaces are replaced with the "▁" character and line-break is represented as "<0x0A>".
-*
-* This helper function returns the vocabulary as an array that contains Strings representing tokens:
-*
-*  "<unk>"   // Special token: unknown token
-*  "<s>"     // Special token: beginning of string
-*  "</s>"    // Special token: end of string
-*  "<0x00>"  // Byte-level token representing the 0-byte
-*  "<0x01>"  // Byte-level token ...
-*  "<0x02>"  // Byte-level token ...
-*  ...       // More byte-level tokens
-*  "<0x0A>"  // Byte-level token representing '\n' (line break). This is one of the few byte-level tokens that appear to be actually needed in practice.
-*  ...       // More byte-level tokens
-*  "<0xFF>"  // Byte-level token ...
-*  "▁▁"     // Token representing 2 consecutive spaces.
-*  "▁t"     // Token representing the space character followed by the "t" character.
-*  "er"      // Token representing the "e" character followed by the "r" character. Most tokens look like this.
-*  ...       // 32000 tokens
-*/
+ * Helper function to decode the vocabulary.
+ *
+ * vocab_base64 is base64-encoded string of tokens delimited by '\n' (line break) in utf-8.
+ * The row number of the token (indexing from 0) represents the id of the token in LLaMA tokenizer.
+ *
+ * Most tokens look like this: "ic" (without the quotes) (representing the "i" character followed by the "c" character)
+ * Some tokens are special. In particular, spaces are replaced with the "▁" character and line-break is represented as "<0x0A>".
+ *
+ * This helper function returns the vocabulary as an array that contains Strings representing tokens:
+ *
+ *  "<unk>"   // Special token: unknown token
+ *  "<s>"     // Special token: beginning of string
+ *  "</s>"    // Special token: end of string
+ *  "<0x00>"  // Byte-level token representing the 0-byte
+ *  "<0x01>"  // Byte-level token ...
+ *  "<0x02>"  // Byte-level token ...
+ *  ...       // More byte-level tokens
+ *  "<0x0A>"  // Byte-level token representing '\n' (line break). This is one of the few byte-level tokens that appear to be actually needed in practice.
+ *  ...       // More byte-level tokens
+ *  "<0xFF>"  // Byte-level token ...
+ *  "▁▁"     // Token representing 2 consecutive spaces.
+ *  "▁t"     // Token representing the space character followed by the "t" character.
+ *  "er"      // Token representing the "e" character followed by the "r" character. Most tokens look like this.
+ *  ...       // 32000 tokens
+ */
 const decodeVocabulary = function (vocab_base64) {
-    const byteArray = Uint8Array.from(base64decode(vocab_base64), c => c.charCodeAt(0));
-    const textDecoder = new TextDecoder('utf-8');
+    const byteArray = Uint8Array.from(base64decode(vocab_base64), (c) => c.charCodeAt(0));
+    const textDecoder = new TextDecoder("utf-8");
     return textDecoder.decode(byteArray).split("\n");
 };
 const utf8ByteToHex = (c) => {
-    const hexValue = c.toString(16).toUpperCase().padStart(2, '0');
+    const hexValue = c.toString(16).toUpperCase().padStart(2, "0");
     return `<0x${hexValue}>`;
 };
 const hexToUtf8Byte = (hex) => {
-    const strippedHex = hex.replace(/<0x|>/g, '');
+    const strippedHex = hex.replace(/<0x|>/g, "");
     return parseInt(strippedHex, 16);
 };
 const utf8Encoder = new TextEncoder();
-const utf8Decoder = new TextDecoder('utf-8');
+const utf8Decoder = new TextDecoder("utf-8");
 class PriorityQueue {
     // PriorityQueue implementation is copied from https://stackoverflow.com/a/42919752 with minor refactoring
     constructor(comparator = (a, b) => a > b) {
@@ -106,7 +108,7 @@ class PriorityQueue {
         return this._heap[0];
     }
     push(...values) {
-        values.forEach(value => {
+        values.forEach((value) => {
             this._heap.push(value);
             this._siftUp();
         });
@@ -152,9 +154,14 @@ class PriorityQueue {
     }
     _siftDown() {
         let node = 0;
-        while ((this._left(node) < this.size() && this._greater(this._left(node), node)) ||
-            (this._right(node) < this.size() && this._greater(this._right(node), node))) {
-            let maxChild = (this._right(node) < this.size() && this._greater(this._right(node), this._left(node))) ? this._right(node) : this._left(node);
+        while ((this._left(node) < this.size() &&
+            this._greater(this._left(node), node)) ||
+            (this._right(node) < this.size() &&
+                this._greater(this._right(node), node))) {
+            let maxChild = this._right(node) < this.size() &&
+                this._greater(this._right(node), this._left(node))
+                ? this._right(node)
+                : this._left(node);
             this._swap(node, maxChild);
             node = maxChild;
         }
@@ -171,7 +178,7 @@ const mapCharactersToTokenIds = (prompt, add_bos_token, add_preceding_space) =>
         prompt = " " + prompt;
     }
     // Special: spaces are represented as thick underscore ▁ (id 29871)
-    const promptAltered = (prompt).replaceAll(" ", llamaTokenizer.vocabById[29871]);
+    const promptAltered = prompt.replaceAll(" ", llamaTokenizer.vocabById[29871]);
     // We need to use Array.from to iterate over characters in order to support UTF-8 multipoint characters
     const charArray = Array.from(promptAltered);
     // Transform each character to its corresponding token
@@ -190,7 +197,13 @@ const mapCharactersToTokenIds = (prompt, add_bos_token, add_preceding_space) =>
                 if (!(hex >= 0)) {
                     // This is not supposed to happen because the LLaMA vocabulary has a token corresponding to each byte,
                     // but if this happens regardless, let's follow the protocol and tokenize to <UNK> token instead of crashing.
-                    console.log('Encountered unknown character ' + c + " (partial UTF-8 byte " + bytes[j] + " + hex + " + utf8ByteToHex(bytes[j]) + ")");
+                    console.log("Encountered unknown character " +
+                        c +
+                        " (partial UTF-8 byte " +
+                        bytes[j] +
+                        " + hex + " +
+                        utf8ByteToHex(bytes[j]) +
+                        ")");
                     tokenIds[tokenIds.length - 1] = 0;
                 }
             }
@@ -203,8 +216,10 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
     if (log_performance) {
         startTime = performance.now();
     }
-    if (!llamaTokenizer.vocabById || !llamaTokenizer.vocabByString || !llamaTokenizer.merges) {
-        console.log('Tokenizer not initialized properly!');
+    if (!llamaTokenizer.vocabById ||
+        !llamaTokenizer.vocabByString ||
+        !llamaTokenizer.merges) {
+        console.log("Tokenizer not initialized properly!");
         return;
     }
     if (prompt.length === 0) {
@@ -221,7 +236,8 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
         // Merge priority is primarily determined by the location of the merge in the "merges" data,
         // secondarily determined by the relative position of the node in the linked list
         // (We want to perform equal merges from left to right)
-        const mergePrio = llamaTokenizer.merges.get(mergeIdentifierString) + leftNode.origPos / prompt.length;
+        const mergePrio = llamaTokenizer.merges.get(mergeIdentifierString) +
+            leftNode.origPos / prompt.length;
         if (mergePrio) {
             // If mergePrio not found in merges, that means this merge is not possible according to vocabulary.
             leftNode.mergePrio = mergePrio;
@@ -242,7 +258,7 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
             origPos: i,
             tokenId: tokenIds[i],
             prev: prevTokenNode,
-            next: null
+            next: null,
         };
         prevTokenNode.next = currTokenNode;
         addToMergeQueue(prevTokenNode);
@@ -271,7 +287,7 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
                 origPos: oldPrev.origPos,
                 tokenId: oldPrev.tokenId,
                 prev: oldPrev.prev,
-                next: oldPrev.next
+                next: oldPrev.next,
             };
             leftOfMerge.prev = newPrev;
             // Update linked list reference of "prev of prev"
@@ -288,7 +304,7 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
             origPos: leftOfMerge.origPos,
             tokenId: llamaTokenizer.vocabByString.get(leftOfMerge.mergeToString),
             prev: leftOfMerge.prev,
-            next: leftOfMerge.next.next
+            next: leftOfMerge.next.next,
         };
         // Consider adding to merge queue: prev--resultOfMerge
         if (resultOfMerge.prev) {
@@ -313,7 +329,7 @@ const encode = (prompt, add_bos_token = true, add_preceding_space = true, log_pe
     }
     if (log_performance) {
         const endTime = performance.now();
-        console.log('Tokenizer running time: ' + (endTime - startTime) + " milliseconds");
+        console.log("Tokenizer running time: " + (endTime - startTime) + " milliseconds");
     }
     return mergedTokenIds;
 };
@@ -331,7 +347,7 @@ const decode = function (tokenIds, add_bos_token = true, add_preceding_space = t
         else {
             // Typical case
             const utf8bytes = utf8Encoder.encode(tokenString);
-            utf8bytes.forEach(utf8Byte => utf8byteVals.push(utf8Byte));
+            utf8bytes.forEach((utf8Byte) => utf8byteVals.push(utf8Byte));
         }
     }
     const uint8Array = new Uint8Array(utf8byteVals);
@@ -342,7 +358,10 @@ const decode = function (tokenIds, add_bos_token = true, add_preceding_space = t
 };
 function runTests() {
     function isEqual(arr1, arr2) {
-        return arr1.length === arr2.length && arr1.every(function (value, index) { return value === arr2[index]; });
+        return (arr1.length === arr2.length &&
+            arr1.every(function (value, index) {
+                return value === arr2[index];
+            }));
     }
     function testCase(inputString, expectedTokenIds) {
         const actualTokens = encode(inputString, true, true, true);
@@ -366,57 +385,51 @@ function runTests() {
     // Equal prio merges are performed left-to-right (fixed in 1.1.1)
     testCase("ax\n####\nboo", [1, 4853, 13, 4136, 13, 833, 29877]);
     // UTF-8 multipoint character that should be found in vocabulary
-    testCase('镇', [1, 29871, 30411]);
+    testCase("镇", [1, 29871, 30411]);
     // UTF-8 multipoint character that should NOT be found in vocabulary, fallback to MULTIPLE byte tokens
-    testCase('🦙', [1, 29871, 243, 162, 169, 156]);
+    testCase("🦙", [1, 29871, 243, 162, 169, 156]);
     // Consecutive UTF-8 multipoint characters that are NOT found in a vocabulary and use DIFFERENT number of bytes
-    testCase('🦙Ꙋ', [1, 29871, 243, 162, 169, 156, 237, 156, 141]);
-    testCase('Ꙋ🦙', [1, 29871, 237, 156, 141, 243, 162, 169, 156]);
+    testCase("🦙Ꙋ", [1, 29871, 243, 162, 169, 156, 237, 156, 141]);
+    testCase("Ꙋ🦙", [1, 29871, 237, 156, 141, 243, 162, 169, 156]);
     // Larger text input with various special characters sprinkled in
-    testCase("The llama (/ˈlɑːmə/; 🦙Spanish pronunciation: [ˈʎama]) (Lama glama) is a domesticated South American camelid, widely used as a meat and pack animal by Andean cultures since the Pre-Columbian era. Llamas are social animals and live with others as a herd. Their wool is soft and contains only a small amount of lanolin.[2] Llamas can learn simple tasks after a few repetitions. When using a pack, they can carry about 25 to 30% of their body weight for 8 to 13 km (5–8 miles).[3] The name llama (in the past also spelled \"lama\" or \"glama\") was adopted by European settlers from native Peruvians.[4] The ancestors of llamas are thought to have originated from the Great Plains of North America about 40 million years ago, and subsequently migrated to South America about three million years ago during the Great American Interchange. By the end of the last ice age (10,000–12,000 years ago), camelids were extinct in North America.[3] As of 2007, there were over seven million llamas and alpacas in South America and over 158,000 llamas and 100,000Ꙋ🦙 alpacas, descended from progenitors imported late in the 20th century, in the United States and Canada.[5] In Aymara mythology, llamas are important beings. The Heavenly Llama is said to drink water from the ocean and urinates as it rains.[6] According to Aymara eschatology, llamas will return to the water springs and lagoons where they come from at the end of time.[6]", [1, 450, 11148, 3304, 20374, 30176, 29880, 30426, 30215, 29885,
-        30184, 29914, 29936, 29871, 243, 162, 169, 156, 15495, 728,
-        11504, 11173, 362, 29901, 518, 30176, 31743, 3304, 2314, 313,
-        29931, 3304, 3144, 3304, 29897, 338, 263, 21849, 630, 4275,
-        3082, 3949, 295, 333, 29892, 17644, 1304, 408, 263, 27654,
-        322, 4870, 13019, 491, 1126, 29872, 273, 4185, 1973, 1951,
-        278, 4721, 29899, 1625, 3774, 713, 3152, 29889, 365, 5288,
-        294, 526, 5264, 15006, 322, 5735, 411, 4045, 408, 263,
-        902, 29881, 29889, 11275, 281, 1507, 338, 4964, 322, 3743,
-        871, 263, 2319, 5253, 310, 10906, 22878, 7226, 29906, 29962,
-        365, 5288, 294, 508, 5110, 2560, 9595, 1156, 263, 2846,
-        21159, 2187, 29889, 1932, 773, 263, 4870, 29892, 896, 508,
-        8677, 1048, 29871, 29906, 29945, 304, 29871, 29941, 29900, 29995,
-        310, 1009, 3573, 7688, 363, 29871, 29947, 304, 29871, 29896,
-        29941, 2383, 313, 29945, 29994, 29947, 7800, 467, 29961, 29941,
-        29962, 450, 1024, 11148, 3304, 313, 262, 278, 4940, 884,
-        805, 14356, 376, 29880, 3304, 29908, 470, 376, 3820, 3304,
-        1159, 471, 16356, 491, 7824, 3604, 9306, 515, 7531, 25493,
-        1403, 550, 7226, 29946, 29962, 450, 19525, 943, 310, 11829,
-        294, 526, 2714, 304, 505, 3978, 630, 515, 278, 7027,
-        13494, 1144, 310, 4644, 6813, 1048, 29871, 29946, 29900, 7284,
-        2440, 8020, 29892, 322, 17602, 9725, 630, 304, 4275, 6813,
-        1048, 2211, 7284, 2440, 8020, 2645, 278, 7027, 3082, 4124,
-        3167, 29889, 2648, 278, 1095, 310, 278, 1833, 14890, 5046,
-        313, 29896, 29900, 29892, 29900, 29900, 29900, 29994, 29896, 29906,
-        29892, 29900, 29900, 29900, 2440, 8020, 511, 3949, 295, 4841,
-        892, 1294, 5562, 297, 4644, 6813, 7226, 29941, 29962, 1094,
-        310, 29871, 29906, 29900, 29900, 29955, 29892, 727, 892, 975,
-        9881, 7284, 11829, 294, 322, 394, 29886, 562, 294, 297,
-        4275, 6813, 322, 975, 29871, 29896, 29945, 29947, 29892, 29900,
-        29900, 29900, 11829, 294, 322, 29871, 29896, 29900, 29900, 29892,
-        29900, 29900, 29900, 237, 156, 141, 243, 162, 169, 156,
-        394, 29886, 562, 294, 29892, 5153, 2760, 515, 410, 1885,
-        17259, 19673, 5683, 297, 278, 29871, 29906, 29900, 386, 6462,
-        29892, 297, 278, 3303, 3900, 322, 7400, 7226, 29945, 29962,
-        512, 319, 962, 2518, 22082, 3002, 29892, 11829, 294, 526,
-        4100, 367, 886, 29889, 450, 22977, 368, 365, 29880, 3304,
-        338, 1497, 304, 13748, 4094, 515, 278, 23474, 322, 5065,
-        262, 1078, 408, 372, 1153, 1144, 7226, 29953, 29962, 7579,
-        304, 319, 962, 2518, 831, 13496, 3002, 29892, 11829, 294,
-        674, 736, 304, 278, 4094, 7689, 886, 322, 301, 4425,
-        787, 988, 896, 2041, 515, 472, 278, 1095, 310, 931,
-        7226, 29953, 29962]);
-    console.log('LLaMA Tokenizer tests passed successfully.');
+    testCase('The llama (/ˈlɑːmə/; 🦙Spanish pronunciation: [ˈʎama]) (Lama glama) is a domesticated South American camelid, widely used as a meat and pack animal by Andean cultures since the Pre-Columbian era. Llamas are social animals and live with others as a herd. Their wool is soft and contains only a small amount of lanolin.[2] Llamas can learn simple tasks after a few repetitions. When using a pack, they can carry about 25 to 30% of their body weight for 8 to 13 km (5–8 miles).[3] The name llama (in the past also spelled "lama" or "glama") was adopted by European settlers from native Peruvians.[4] The ancestors of llamas are thought to have originated from the Great Plains of North America about 40 million years ago, and subsequently migrated to South America about three million years ago during the Great American Interchange. By the end of the last ice age (10,000–12,000 years ago), camelids were extinct in North America.[3] As of 2007, there were over seven million llamas and alpacas in South America and over 158,000 llamas and 100,000Ꙋ🦙 alpacas, descended from progenitors imported late in the 20th century, in the United States and Canada.[5] In Aymara mythology, llamas are important beings. The Heavenly Llama is said to drink water from the ocean and urinates as it rains.[6] According to Aymara eschatology, llamas will return to the water springs and lagoons where they come from at the end of time.[6]', [
+        1, 450, 11148, 3304, 20374, 30176, 29880, 30426, 30215, 29885, 30184,
+        29914, 29936, 29871, 243, 162, 169, 156, 15495, 728, 11504, 11173, 362,
+        29901, 518, 30176, 31743, 3304, 2314, 313, 29931, 3304, 3144, 3304, 29897,
+        338, 263, 21849, 630, 4275, 3082, 3949, 295, 333, 29892, 17644, 1304, 408,
+        263, 27654, 322, 4870, 13019, 491, 1126, 29872, 273, 4185, 1973, 1951,
+        278, 4721, 29899, 1625, 3774, 713, 3152, 29889, 365, 5288, 294, 526, 5264,
+        15006, 322, 5735, 411, 4045, 408, 263, 902, 29881, 29889, 11275, 281,
+        1507, 338, 4964, 322, 3743, 871, 263, 2319, 5253, 310, 10906, 22878, 7226,
+        29906, 29962, 365, 5288, 294, 508, 5110, 2560, 9595, 1156, 263, 2846,
+        21159, 2187, 29889, 1932, 773, 263, 4870, 29892, 896, 508, 8677, 1048,
+        29871, 29906, 29945, 304, 29871, 29941, 29900, 29995, 310, 1009, 3573,
+        7688, 363, 29871, 29947, 304, 29871, 29896, 29941, 2383, 313, 29945,
+        29994, 29947, 7800, 467, 29961, 29941, 29962, 450, 1024, 11148, 3304, 313,
+        262, 278, 4940, 884, 805, 14356, 376, 29880, 3304, 29908, 470, 376, 3820,
+        3304, 1159, 471, 16356, 491, 7824, 3604, 9306, 515, 7531, 25493, 1403,
+        550, 7226, 29946, 29962, 450, 19525, 943, 310, 11829, 294, 526, 2714, 304,
+        505, 3978, 630, 515, 278, 7027, 13494, 1144, 310, 4644, 6813, 1048, 29871,
+        29946, 29900, 7284, 2440, 8020, 29892, 322, 17602, 9725, 630, 304, 4275,
+        6813, 1048, 2211, 7284, 2440, 8020, 2645, 278, 7027, 3082, 4124, 3167,
+        29889, 2648, 278, 1095, 310, 278, 1833, 14890, 5046, 313, 29896, 29900,
+        29892, 29900, 29900, 29900, 29994, 29896, 29906, 29892, 29900, 29900,
+        29900, 2440, 8020, 511, 3949, 295, 4841, 892, 1294, 5562, 297, 4644, 6813,
+        7226, 29941, 29962, 1094, 310, 29871, 29906, 29900, 29900, 29955, 29892,
+        727, 892, 975, 9881, 7284, 11829, 294, 322, 394, 29886, 562, 294, 297,
+        4275, 6813, 322, 975, 29871, 29896, 29945, 29947, 29892, 29900, 29900,
+        29900, 11829, 294, 322, 29871, 29896, 29900, 29900, 29892, 29900, 29900,
+        29900, 237, 156, 141, 243, 162, 169, 156, 394, 29886, 562, 294, 29892,
+        5153, 2760, 515, 410, 1885, 17259, 19673, 5683, 297, 278, 29871, 29906,
+        29900, 386, 6462, 29892, 297, 278, 3303, 3900, 322, 7400, 7226, 29945,
+        29962, 512, 319, 962, 2518, 22082, 3002, 29892, 11829, 294, 526, 4100,
+        367, 886, 29889, 450, 22977, 368, 365, 29880, 3304, 338, 1497, 304, 13748,
+        4094, 515, 278, 23474, 322, 5065, 262, 1078, 408, 372, 1153, 1144, 7226,
+        29953, 29962, 7579, 304, 319, 962, 2518, 831, 13496, 3002, 29892, 11829,
+        294, 674, 736, 304, 278, 4094, 7689, 886, 322, 301, 4425, 787, 988, 896,
+        2041, 515, 472, 278, 1095, 310, 931, 7226, 29953, 29962,
+    ]);
+    console.log("LLaMA Tokenizer tests passed successfully.");
     return true;
 }
 function initializeLlamaTokenizer() {

package/dist/lib/_trie.js CHANGED Viewed

@@ -20,7 +20,7 @@ class Trie {
      */
     addPrefix(prefix) {
         let node = this.root;
-        prefix.forEach(num => {
+        prefix.forEach((num) => {
             if (!node.children.has(num)) {
                 node.children.set(num, new TrieNode());
             }

package/dist/lib/template.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
-import { AbstractTokenizer } from './tokenizer';
-import { AbstractTokenGenerator } from './token-generator';
+import { AbstractTokenizer } from "./tokenizer";
+import { AbstractTokenGenerator } from "./token-generator";
 export declare enum TEMPLATE_METHODS {
     SEL = "SEL",
     GEN = "GEN"
@@ -11,6 +11,7 @@ export declare class TemplateProcessor {
     setTokenizer(tokenizer: AbstractTokenizer): void;
     setGenerator(generator: AbstractTokenGenerator): void;
     processTemplate(template: string, variables: Map<string, string | string[]>): Promise<Map<string, string>>;
+    processTemplateStream(template: string, variables: Map<string, string | string[]>): AsyncGenerator<Map<string, string>, void>;
     private findAllIndexes;
 }
 //# sourceMappingURL=template.d.ts.map

package/dist/lib/template.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"template.d.ts","sourceRoot":"","sources":["../../src/lib/template.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,iBAAiB,EAAE,MAAM,aAAa,CAAC;AAChD,OAAO,EAAE,sBAAsB,EAAE,MAAM,mBAAmB,CAAC;AAE3D,oBAAY,gBAAgB;IAC1B,GAAG,QAAQ;IACX,GAAG,QAAQ;CACZ;AAED,qBAAa,iBAAiB;IAC5B,OAAO,CAAC,SAAS,CAAoB;IACrC,OAAO,CAAC,SAAS,CAAyB;gBAE9B,SAAS,EAAE,iBAAiB,EAAE,SAAS,EAAE,sBAAsB;IAKpE,YAAY,CAAC,SAAS,EAAE,iBAAiB;IAIzC,YAAY,CAAC,SAAS,EAAE,sBAAsB;IAIxC,eAAe,~~CAAC~~,QAAQ,EAAE,MAAM,~~EAAE~~,SAAS,EAAE,GAAG,CAAC,MAAM,EAAE,MAAM,~~GAAC~~,MAAM,EAAE,CAAC,~~GAAG~~,OAAO,CAAC,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;~~IAkFrH~~,OAAO,CAAC,cAAc;CAQvB"}
1	+ {"version":3,"file":"template.d.ts","sourceRoot":"","sources":["../../src/lib/template.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,iBAAiB,EAAE,MAAM,aAAa,CAAC;AAChD,OAAO,EAAE,sBAAsB,EAAE,MAAM,mBAAmB,CAAC;AAE3D,oBAAY,gBAAgB;IAC1B,GAAG,QAAQ;IACX,GAAG,QAAQ;CACZ;AAED,qBAAa,iBAAiB;IAC5B,OAAO,CAAC,SAAS,CAAoB;IACrC,OAAO,CAAC,SAAS,CAAyB;gBAE9B,SAAS,EAAE,iBAAiB,EAAE,SAAS,EAAE,sBAAsB;IAKpE,YAAY,CAAC,SAAS,EAAE,iBAAiB;IAIzC,YAAY,CAAC,SAAS,EAAE,sBAAsB;IAIxC,eAAe,CAC1B,QAAQ,EAAE,MAAM,EAChB,SAAS,EAAE,GAAG,CAAC,MAAM,EAAE,MAAM,GAAG,MAAM,EAAE,CAAC,GACxC,OAAO,CAAC,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAYjB,qBAAqB,CACjC,QAAQ,EAAE,MAAM,EAChB,SAAS,EAAE,GAAG,CAAC,MAAM,EAAE,MAAM,GAAG,MAAM,EAAE,CAAC,GACxC,cAAc,CAAC,GAAG,CAAC,MAAM,EAAE,MAAM,CAAC,EAAE,IAAI,CAAC;IA2G5C,OAAO,CAAC,cAAc;CAQvB"}

package/dist/lib/template.js CHANGED Viewed

@@ -8,6 +8,25 @@ var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, ge
         step((generator = generator.apply(thisArg, _arguments || [])).next());
     });
 };
+var __asyncValues = (this && this.__asyncValues) || function (o) {
+    if (!Symbol.asyncIterator) throw new TypeError("Symbol.asyncIterator is not defined.");
+    var m = o[Symbol.asyncIterator], i;
+    return m ? m.call(o) : (o = typeof __values === "function" ? __values(o) : o[Symbol.iterator](), i = {}, verb("next"), verb("throw"), verb("return"), i[Symbol.asyncIterator] = function () { return this; }, i);
+    function verb(n) { i[n] = o[n] && function (v) { return new Promise(function (resolve, reject) { v = o[n](v), settle(resolve, reject, v.done, v.value); }); }; }
+    function settle(resolve, reject, d, v) { Promise.resolve(v).then(function(v) { resolve({ value: v, done: d }); }, reject); }
+};
+var __await = (this && this.__await) || function (v) { return this instanceof __await ? (this.v = v, this) : new __await(v); }
+var __asyncGenerator = (this && this.__asyncGenerator) || function (thisArg, _arguments, generator) {
+    if (!Symbol.asyncIterator) throw new TypeError("Symbol.asyncIterator is not defined.");
+    var g = generator.apply(thisArg, _arguments || []), i, q = [];
+    return i = {}, verb("next"), verb("throw"), verb("return"), i[Symbol.asyncIterator] = function () { return this; }, i;
+    function verb(n) { if (g[n]) i[n] = function (v) { return new Promise(function (a, b) { q.push([n, v, a, b]) > 1 || resume(n, v); }); }; }
+    function resume(n, v) { try { step(g[n](v)); } catch (e) { settle(q[0][3], e); } }
+    function step(r) { r.value instanceof __await ? Promise.resolve(r.value.v).then(fulfill, reject) : settle(q[0][2], r); }
+    function fulfill(value) { resume("next", value); }
+    function reject(value) { resume("throw", value); }
+    function settle(f, v) { if (f(v), q.shift(), q.length) resume(q[0][0], q[0][1]); }
+};
 var __importDefault = (this && this.__importDefault) || function (mod) {
     return (mod && mod.__esModule) ? mod : { "default": mod };
 };
@@ -31,50 +50,94 @@ class TemplateProcessor {
         this.generator = generator;
     }
     processTemplate(template, variables) {
+        var _a, e_1, _b, _c;
         return __awaiter(this, void 0, void 0, function* () {
+            let finalResult = new Map();
+            try {
+                for (var _d = true, _e = __asyncValues(this.processTemplateStream(template, variables)), _f; _f = yield _e.next(), _a = _f.done, !_a; _d = true) {
+                    _c = _f.value;
+                    _d = false;
+                    const partialResult = _c;
+                    finalResult = partialResult;
+                }
+            }
+            catch (e_1_1) { e_1 = { error: e_1_1 }; }
+            finally {
+                try {
+                    if (!_d && !_a && (_b = _e.return)) yield _b.call(_e);
+                }
+                finally { if (e_1) throw e_1.error; }
+            }
+            return finalResult;
+        });
+    }
+    processTemplateStream(template, variables) {
+        return __asyncGenerator(this, arguments, function* processTemplateStream_1() {
+            var _a, e_2, _b, _c;
             const result = new Map();
             // Replace {{val}} in template with variables[val]
             variables.forEach((value, key) => {
-                template = template.replace(new RegExp(`{{${key}}}`, 'g'), value.toString());
+                template = template.replace(new RegExp(`{{${key}}}`, "g"), value.toString());
             });
             // Replace {{method variableName methodArg1=methodArg1Value methodArg2=methodArg2Value}} in template
-            const indexes = this.findAllIndexes(template, '{{');
+            const indexes = this.findAllIndexes(template, "{{");
             let nextTemplateIndexForPrompt = 0;
-            let prompt = '';
+            let prompt = "";
             for (let i = 0; i < indexes.length; i++) {
                 prompt += template.substring(nextTemplateIndexForPrompt, indexes[i]);
                 const start = indexes[i] + 2;
-                const end = template.substring(start).indexOf('}}') + start;
+                const end = template.substring(start).indexOf("}}") + start;
                 const content = template.substring(start, end);
-                const args = content.split(' ');
+                const args = content.split(" ");
                 const method = args[0];
                 const variableName = args[1];
-                const methodArgs = args.slice(2).reduce((acc, arg) => {
-                    const [key, value] = arg.split('=');
+                const methodArgs = args
+                    .slice(2)
+                    .reduce((acc, arg) => {
+                    const [key, value] = arg.split("=");
                     acc[key] = value;
                     return acc;
                 }, {});
-                let completion = '';
+                let completion = "";
                 switch (method) {
                     case TEMPLATE_METHODS.GEN:
-                        completion = yield this.generator.generateString(prompt, methodArgs);
-                        // Remove string after stop
-                        if (methodArgs['stop']) {
-                            if (completion.indexOf(methodArgs['stop']) >= 0) {
-                                completion = completion.substring(0, completion.indexOf(methodArgs['stop']));
+                        const stream = this.generator.generateString(prompt, methodArgs);
+                        try {
+                            for (var _d = true, stream_1 = (e_2 = void 0, __asyncValues(stream)), stream_1_1; stream_1_1 = yield __await(stream_1.next()), _a = stream_1_1.done, !_a; _d = true) {
+                                _c = stream_1_1.value;
+                                _d = false;
+                                const chunk = _c;
+                                completion = chunk;
+                                // Remove string after stop
+                                if (methodArgs["stop"]) {
+                                    if (completion.indexOf(methodArgs["stop"]) >= 0) {
+                                        completion = completion.substring(0, completion.indexOf(methodArgs["stop"]));
+                                    }
+                                }
+                                result.set(variableName, completion);
+                                yield yield __await(result);
                             }
                         }
-                        result.set(variableName, completion);
+                        catch (e_2_1) { e_2 = { error: e_2_1 }; }
+                        finally {
+                            try {
+                                if (!_d && !_a && (_b = stream_1.return)) yield __await(_b.call(stream_1));
+                            }
+                            finally { if (e_2) throw e_2.error; }
+                        }
                         break;
                     case TEMPLATE_METHODS.SEL:
                         const trie = new _trie_1.default();
                         // Get options from variables
-                        const options = variables.get(methodArgs['options']);
+                        const options = variables.get(methodArgs["options"]);
                         if (!options) {
-                            throw new Error(`${methodArgs['options']} variable not found`);
+                            throw new Error(`${methodArgs["options"]} variable not found`);
                         }
                         // Add all options to trie
-                        options.forEach(option => trie.addPrefix(this.tokenizer.encodeString(prompt + option + this.tokenizer.getEOS())));
+                        options.forEach((option) => {
+                            const prefix = this.tokenizer.encodeString(prompt + option + this.tokenizer.getEOS());
+                            trie.addPrefix(prefix);
+                        });
                         let currentPrefixPrompt = prompt;
                         do {
                             const currentPrefix = trie.getNextPrefix(this.tokenizer.encodeString(currentPrefixPrompt));
@@ -82,19 +145,23 @@ class TemplateProcessor {
                             const nextChildren = trie.getNextChildren(currentPrefix);
                             if (nextChildren.length < 2) {
                                 // If there is only one child, we complete
-                                completion = this.tokenizer.decodeString(trie.getWord(currentPrefix)).substring(prompt.length).replace(this.tokenizer.getEOS(), '');
+                                completion = this.tokenizer
+                                    .decodeString(trie.getWord(currentPrefix))
+                                    .substring(prompt.length)
+                                    .replace(this.tokenizer.getEOS(), "");
                                 break;
                             }
                             else {
                                 // If there is more than one child, we generate the next token
-                                const nextToken = yield this.generator.generateToken(prompt, nextChildren.reduce((acc, child) => {
+                                const nextToken = yield __await(this.generator.generateToken(prompt, nextChildren.reduce((acc, child) => {
                                     acc[child.toString()] = 100;
                                     return acc;
-                                }, {}));
+                                }, {})));
                                 currentPrefixPrompt = currentPrefixPrompt + nextToken;
                             }
                         } while (!completion);
                         result.set(variableName, completion);
+                        yield yield __await(result);
                         break;
                     default:
                         throw new Error(`Invalid method ${method} in template`);
@@ -102,7 +169,6 @@ class TemplateProcessor {
                 prompt += completion;
                 nextTemplateIndexForPrompt = end + 2;
             }
-            return result;
         });
     }
     findAllIndexes(str, substr) {

package/dist/lib/token-generator.d.ts CHANGED Viewed

@@ -1,7 +1,8 @@
-import { ClientOptions } from 'openai';
+import { ClientOptions } from "openai";
+import { CompletionCreateParams } from "openai/resources/completions.mjs";
 export declare abstract class AbstractTokenGenerator {
     abstract generateToken(prompt: string, logit_bias: Record<string, number>): Promise<string>;
-    abstract generateString(prompt: string, options: Record<string, string>): Promise<string>;
+    abstract generateString(prompt: string, options: Record<string, string>): AsyncGenerator<string>;
 }
 /**
  * OpenAI Token Generator
@@ -10,12 +11,13 @@ export declare abstract class AbstractTokenGenerator {
 export declare class OpenAITokenGenerator extends AbstractTokenGenerator {
     private openai;
     private model;
+    private defaultCompletionParams?;
     constructor(params: {
         apiKey: string;
         model: string;
         baseURL?: string;
-    }, options?: ClientOptions);
+    }, options?: ClientOptions, defaultCompletionParams?: CompletionCreateParams);
     generateToken(prompt: string, logit_bias: Record<string, number>): Promise<string>;
-    generateString(prompt: string, options: Record<string, string>): Promise<string>;
+    generateString(prompt: string, options: Record<string, string>): AsyncGenerator<string>;
 }
 //# sourceMappingURL=token-generator.d.ts.map

package/dist/lib/token-generator.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"token-generator.d.ts","sourceRoot":"","sources":["../../src/lib/token-generator.ts"],"names":[],"mappings":"AAAA,OAAe,EAAE,aAAa,EAAE,MAAM,QAAQ,~~CAAA~~;~~AAE9C~~,8BAAsB,sBAAsB;IAC1C,QAAQ,CAAC,aAAa,~~CAAC~~,MAAM,EAAE,MAAM,~~EAAE~~,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,~~GAAG~~,OAAO,CAAC,MAAM,CAAC;~~IAC3F~~,QAAQ,CAAC,cAAc,~~CAAC~~,MAAM,EAAE,MAAM,~~EAAE~~,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,~~GAAG~~,~~OAAO~~,CAAC,MAAM,CAAC;~~CAC1F~~;AACD;;;GAGG;AACH,qBAAa,oBAAqB,SAAQ,sBAAsB;IAC9D,OAAO,CAAC,MAAM,CAAS;IACvB,OAAO,CAAC,KAAK,CAAS;~~gBAEV~~,MAAM,EAAE;~~QAClB~~,MAAM,EAAE,MAAM,CAAC;QACf,KAAK,EAAE,MAAM,CAAC;QACd,OAAO,CAAC,EAAE,MAAM,CAAC;KAClB,~~EAAE~~,OAAO,CAAC,EAAE,aAAa;~~IAUX~~,aAAa,~~CAAC~~,MAAM,EAAE,MAAM,~~EAAE~~,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,~~GAAG~~,OAAO,CAAC,MAAM,CAAC;~~IAoClF~~,cAAc,~~CAAC~~,MAAM,EAAE,MAAM,~~EAAE~~,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,~~GAAG~~,~~OAAO~~,CAAC,MAAM,CAAC;~~CAShG~~"}
1	+ {"version":3,"file":"token-generator.d.ts","sourceRoot":"","sources":["../../src/lib/token-generator.ts"],"names":[],"mappings":"AAAA,OAAe,EAAE,aAAa,EAAE,MAAM,QAAQ,CAAC;AAC/C,OAAO,EAAE,sBAAsB,EAAE,MAAM,kCAAkC,CAAC;AAE1E,8BAAsB,sBAAsB;IAC1C,QAAQ,CAAC,aAAa,CACpB,MAAM,EAAE,MAAM,EACd,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,GACjC,OAAO,CAAC,MAAM,CAAC;IAClB,QAAQ,CAAC,cAAc,CACrB,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,GAC9B,cAAc,CAAC,MAAM,CAAC;CAC1B;AACD;;;GAGG;AACH,qBAAa,oBAAqB,SAAQ,sBAAsB;IAC9D,OAAO,CAAC,MAAM,CAAS;IACvB,OAAO,CAAC,KAAK,CAAS;IACtB,OAAO,CAAC,uBAAuB,CAAC,CAAyB;gBAGvD,MAAM,EAAE;QACN,MAAM,EAAE,MAAM,CAAC;QACf,KAAK,EAAE,MAAM,CAAC;QACd,OAAO,CAAC,EAAE,MAAM,CAAC;KAClB,EACD,OAAO,CAAC,EAAE,aAAa,EACvB,uBAAuB,CAAC,EAAE,sBAAsB;IAYnC,aAAa,CAC1B,MAAM,EAAE,MAAM,EACd,UAAU,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,GACjC,OAAO,CAAC,MAAM,CAAC;IAwCF,cAAc,CAC5B,MAAM,EAAE,MAAM,EACd,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,GAC9B,cAAc,CAAC,MAAM,CAAC;CAkB1B"}

package/dist/lib/token-generator.js CHANGED Viewed

@@ -8,6 +8,25 @@ var __awaiter = (this && this.__awaiter) || function (thisArg, _arguments, P, ge
         step((generator = generator.apply(thisArg, _arguments || [])).next());
     });
 };
+var __await = (this && this.__await) || function (v) { return this instanceof __await ? (this.v = v, this) : new __await(v); }
+var __asyncValues = (this && this.__asyncValues) || function (o) {
+    if (!Symbol.asyncIterator) throw new TypeError("Symbol.asyncIterator is not defined.");
+    var m = o[Symbol.asyncIterator], i;
+    return m ? m.call(o) : (o = typeof __values === "function" ? __values(o) : o[Symbol.iterator](), i = {}, verb("next"), verb("throw"), verb("return"), i[Symbol.asyncIterator] = function () { return this; }, i);
+    function verb(n) { i[n] = o[n] && function (v) { return new Promise(function (resolve, reject) { v = o[n](v), settle(resolve, reject, v.done, v.value); }); }; }
+    function settle(resolve, reject, d, v) { Promise.resolve(v).then(function(v) { resolve({ value: v, done: d }); }, reject); }
+};
+var __asyncGenerator = (this && this.__asyncGenerator) || function (thisArg, _arguments, generator) {
+    if (!Symbol.asyncIterator) throw new TypeError("Symbol.asyncIterator is not defined.");
+    var g = generator.apply(thisArg, _arguments || []), i, q = [];
+    return i = {}, verb("next"), verb("throw"), verb("return"), i[Symbol.asyncIterator] = function () { return this; }, i;
+    function verb(n) { if (g[n]) i[n] = function (v) { return new Promise(function (a, b) { q.push([n, v, a, b]) > 1 || resume(n, v); }); }; }
+    function resume(n, v) { try { step(g[n](v)); } catch (e) { settle(q[0][3], e); } }
+    function step(r) { r.value instanceof __await ? Promise.resolve(r.value.v).then(fulfill, reject) : settle(q[0][2], r); }
+    function fulfill(value) { resume("next", value); }
+    function reject(value) { resume("throw", value); }
+    function settle(f, v) { if (f(v), q.shift(), q.length) resume(q[0][0], q[0][1]); }
+};
 var __importDefault = (this && this.__importDefault) || function (mod) {
     return (mod && mod.__esModule) ? mod : { "default": mod };
 };
@@ -22,26 +41,24 @@ exports.AbstractTokenGenerator = AbstractTokenGenerator;
  *
  */
 class OpenAITokenGenerator extends AbstractTokenGenerator {
-    constructor(params, options) {
+    constructor(params, options, defaultCompletionParams) {
         super();
         this.model = params.model;
         this.openai = new openai_1.default(Object.assign({ apiKey: params.apiKey, baseURL: params.baseURL }, options));
+        this.defaultCompletionParams = defaultCompletionParams;
     }
     generateToken(prompt, logit_bias) {
         var _a;
         return __awaiter(this, void 0, void 0, function* () {
-            const result = yield this.openai.completions.create({
-                model: this.model,
-                prompt,
-                logit_bias,
-                logprobs: 10,
-                max_tokens: 1,
-            });
+            const result = yield this.openai.completions.create(Object.assign(Object.assign({}, this.defaultCompletionParams), { stream: false, model: this.model, prompt,
+                logit_bias, logprobs: 10, max_tokens: 1 }));
             const logprobsResult = ((_a = result.choices[0].logprobs) === null || _a === void 0 ? void 0 : _a.top_logprobs) || [];
-            const top_logprobs = logprobsResult ? logprobsResult[0] : { '2': 0 };
+            const top_logprobs = logprobsResult
+                ? logprobsResult[0]
+                : { "2": 0 };
             // get max top_logpobs that is in logit_bias
             let max = -Infinity;
-            let max_key = '';
+            let max_key = "";
             for (const key in top_logprobs) {
                 if (top_logprobs[key] > max && key in logit_bias) {
                     max = top_logprobs[key];
@@ -49,7 +66,7 @@ class OpenAITokenGenerator extends AbstractTokenGenerator {
                 }
             }
             // if no key in logit_bias, get max top_logprobs
-            if (max_key === '') {
+            if (max_key === "") {
                 // no key in logit_bias
                 max = -Infinity;
                 for (const key in top_logprobs) {
@@ -63,9 +80,30 @@ class OpenAITokenGenerator extends AbstractTokenGenerator {
         });
     }
     generateString(prompt, options) {
-        return __awaiter(this, void 0, void 0, function* () {
-            const result = yield this.openai.completions.create(Object.assign({ model: this.model, prompt }, options));
-            return result.choices[0].text;
+        var _a, _b;
+        return __asyncGenerator(this, arguments, function* generateString_1() {
+            var _c, e_1, _d, _e;
+            const stream = yield __await(this.openai.completions.create(Object.assign(Object.assign(Object.assign({}, this.defaultCompletionParams), options), { stop: [
+                    ...(((_a = this.defaultCompletionParams) === null || _a === void 0 ? void 0 : _a.stop) || []),
+                    ...(options.stop ? options.stop.split(",") : []),
+                ], model: this.model, prompt, stream: true })));
+            let result = "";
+            try {
+                for (var _f = true, stream_1 = __asyncValues(stream), stream_1_1; stream_1_1 = yield __await(stream_1.next()), _c = stream_1_1.done, !_c; _f = true) {
+                    _e = stream_1_1.value;
+                    _f = false;
+                    const chunk = _e;
+                    result += (_b = chunk.choices[0]) === null || _b === void 0 ? void 0 : _b.text;
+                    yield yield __await(result);
+                }
+            }
+            catch (e_1_1) { e_1 = { error: e_1_1 }; }
+            finally {
+                try {
+                    if (!_f && !_c && (_d = stream_1.return)) yield __await(_d.call(stream_1));
+                }
+                finally { if (e_1) throw e_1.error; }
+            }
         });
     }
 }

package/dist/lib/tokenizer.d.ts.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"tokenizer.d.ts","sourceRoot":"","sources":["../../src/lib/tokenizer.ts"],"names":[],"mappings":"AAGA,8BAAsB,iBAAiB;IACrC,QAAQ,CAAC,YAAY,CAAC,GAAG,EAAE,MAAM,GAAG,MAAM,EAAE;IAC5C,QAAQ,CAAC,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM;IAC5C,QAAQ,CAAC,MAAM,IAAI,MAAM;CAC1B;AAED,qBAAa,cAAe,SAAQ,iBAAiB;IAC1C,YAAY,~~CAAC~~,GAAG,EAAE,MAAM,~~EAAE~~,aAAa,CAAC,EAAE,OAAO,~~EAAE~~,mBAAmB,CAAC,EAAE,OAAO,~~EAAE~~,eAAe,CAAC,EAAE,OAAO,~~GAAG~~,MAAM,EAAE;~~IAWtH~~,YAAY,~~CAAC~~,GAAG,EAAE,MAAM,EAAE,~~EAAE~~,aAAa,CAAC,EAAE,OAAO,~~EAAE~~,mBAAmB,CAAC,EAAE,OAAO,~~GAAG~~,MAAM;~~IAQ3F~~,MAAM,IAAI,MAAM;CAG1B;AAED,qBAAa,YAAa,SAAQ,iBAAiB;IACxC,YAAY,CAAC,GAAG,EAAE,MAAM,GAAG,MAAM,EAAE;IAMnC,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM;IAInC,MAAM,IAAI,MAAM;CAG1B"}
1	+ {"version":3,"file":"tokenizer.d.ts","sourceRoot":"","sources":["../../src/lib/tokenizer.ts"],"names":[],"mappings":"AAGA,8BAAsB,iBAAiB;IACrC,QAAQ,CAAC,YAAY,CAAC,GAAG,EAAE,MAAM,GAAG,MAAM,EAAE;IAC5C,QAAQ,CAAC,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM;IAC5C,QAAQ,CAAC,MAAM,IAAI,MAAM;CAC1B;AAED,qBAAa,cAAe,SAAQ,iBAAiB;IAC1C,YAAY,CACnB,GAAG,EAAE,MAAM,EACX,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,EAC7B,eAAe,CAAC,EAAE,OAAO,GACxB,MAAM,EAAE;IAqBF,YAAY,CACnB,GAAG,EAAE,MAAM,EAAE,EACb,aAAa,CAAC,EAAE,OAAO,EACvB,mBAAmB,CAAC,EAAE,OAAO,GAC5B,MAAM;IAWA,MAAM,IAAI,MAAM;CAG1B;AAED,qBAAa,YAAa,SAAQ,iBAAiB;IACxC,YAAY,CAAC,GAAG,EAAE,MAAM,GAAG,MAAM,EAAE;IAMnC,YAAY,CAAC,GAAG,EAAE,MAAM,EAAE,GAAG,MAAM;IAInC,MAAM,IAAI,MAAM;CAG1B"}

package/dist/lib/tokenizer.js CHANGED Viewed

@@ -15,7 +15,7 @@ class LLaMATokenizer extends AbstractTokenizer {
             str = str.substring(0, str.length - this.getEOS().length);
             return [
                 ..._llama_tokenizer_1.default.encode(str, add_bos_token, add_preceding_space, log_performance),
-                2 // EOS
+                2, // EOS
             ];
         }
         return _llama_tokenizer_1.default.encode(str, add_bos_token, add_preceding_space, log_performance);
@@ -23,26 +23,27 @@ class LLaMATokenizer extends AbstractTokenizer {
     decodeString(arr, add_bos_token, add_preceding_space) {
         if (arr[arr.length - 1] === 2) {
             arr = arr.slice(0, arr.length - 1);
-            return _llama_tokenizer_1.default.decode(arr, add_bos_token, add_preceding_space) + this.getEOS();
+            return (_llama_tokenizer_1.default.decode(arr, add_bos_token, add_preceding_space) +
+                this.getEOS());
         }
         return _llama_tokenizer_1.default.decode(arr, add_bos_token, add_preceding_space);
     }
     getEOS() {
-        return '</s>';
+        return "</s>";
     }
 }
 exports.LLaMATokenizer = LLaMATokenizer;
 class GTPTokenizer extends AbstractTokenizer {
     encodeString(str) {
         return (0, gpt_tokenizer_1.encode)(str, {
-            allowedSpecial: new Set([this.getEOS()])
+            allowedSpecial: new Set([this.getEOS()]),
         });
     }
     decodeString(arr) {
         return (0, gpt_tokenizer_1.decode)(arr);
     }
     getEOS() {
-        return '<|endoftext|>';
+        return "<|endoftext|>";
     }
 }
 exports.GTPTokenizer = GTPTokenizer;

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mikugg/guidance",
-  "version": "0.8.0",
+  "version": "0.10.0",
   "description": "",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",
@@ -39,5 +39,5 @@
     "ts-node": "^10.9.1",
     "typescript": "^5.2.2"
   },
-  "gitHead": "e0e2c0cc7fbde0c7d477a6907658a76a18e4fd0b"
+  "gitHead": "73073416020c05b15d4f58805fe914743e7ffd6e"
 }