npm - @genai-fi/nanogpt - Versions diffs - 0.15.13 → 0.16.1 - Mend

@genai-fi/nanogpt 0.15.13 → 0.16.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32)

package/dist/TeachableLLM.d.ts +1 -1
package/dist/Trainer.js +10 -5
package/dist/data/docx.d.ts +2 -1
package/dist/data/docx.js +8 -8
package/dist/data/parquet.d.ts +2 -1
package/dist/data/parquet.js +5 -5
package/dist/data/pdf.d.ts +2 -1
package/dist/data/pdf.js +1 -1
package/dist/data/textLoader.d.ts +2 -1
package/dist/data/textLoader.js +55 -48
package/dist/tokeniser/BaseTokeniser.d.ts +2 -2
package/dist/tokeniser/BaseTokeniser.js +35 -35
package/dist/tokeniser/CharTokeniser.d.ts +2 -1
package/dist/tokeniser/CharTokeniser.js +15 -15
package/dist/tokeniser/bpe.d.ts +2 -1
package/dist/tokeniser/bpe.js +40 -40
package/dist/tokeniser/type.d.ts +2 -2
package/dist/training/BasicTrainer.js +62 -62
package/dist/training/Evaluator.d.ts +2 -1
package/dist/training/Evaluator.js +19 -18
package/dist/training/SFTDatasetBuilder.js +47 -38
package/dist/training/tasks/ConversationTask.d.ts +2 -2
package/dist/training/tasks/ConversationTask.js +13 -11
package/dist/training/tasks/PretrainingTask.d.ts +1 -2
package/dist/training/tasks/PretrainingTask.js +4 -14
package/dist/training/tasks/StartSentenceTask.d.ts +1 -2
package/dist/training/tasks/StartSentenceTask.js +2 -7
package/dist/training/tasks/Task.d.ts +1 -2
package/dist/training/tasks/splitter.d.ts +5 -0
package/dist/training/tasks/splitter.js +21 -0
package/dist/training/validation.js +1 -1
package/package.json +1 -1

package/dist/training/tasks/ConversationTask.js CHANGED Viewed

@@ -1,6 +1,8 @@
 import { Task as t } from "./Task.js";
+import { shuffle as s } from "../DatasetBuilder.js";
 class a extends t {
   rawConvo;
+  shuffledIndices = null;
   index = 0;
   get length() {
     return this.rawConvo.length;
@@ -14,20 +16,20 @@ class a extends t {
   nextConversation() {
     if (this.index >= this.rawConvo.length)
       return null;
-    const n = this.rawConvo[this.index];
+    const n = this.rawConvo[this.shuffledIndices ? this.shuffledIndices[this.index] : this.index];
     return this.index++, n;
   }
   nextTokens(n) {
-    const o = this.nextConversation();
-    return o ? n.encodeConversation(o) : null;
-  }
-  getRandomConversation() {
-    const n = Math.floor(Math.random() * this.rawConvo.length);
-    return this.rawConvo[n];
-  }
-  getRandomTokens(n) {
-    const o = Math.floor(Math.random() * this.rawConvo.length);
-    return n.encodeConversation(this.rawConvo[o]);
+    const e = this.nextConversation();
+    return e ? n.encodeConversation(e) : null;
+  }
+  shuffle() {
+    if (!this.shuffledIndices) {
+      this.shuffledIndices = new Uint32Array(this.rawConvo.length);
+      for (let n = 0; n < this.rawConvo.length; n++)
+        this.shuffledIndices[n] = n;
+    }
+    s(this.shuffledIndices), this.index = 0;
   }
   async estimateTokens(n) {
     return (await n.encodeConversation(this.rawConvo[0])).length * this.length;

package/dist/training/tasks/PretrainingTask.d.ts CHANGED Viewed

@@ -8,7 +8,6 @@ export default class PretrainingTask extends Task {
     hasMoreConversations(): boolean;
     nextConversation(): Conversation[] | null;
     nextTokens(tokeniser: ITokeniser): number[] | null;
-    getRandomConversation(): Conversation[];
-    getRandomTokens(tokeniser: ITokeniser): number[];
+    shuffle(): void;
     estimateTokens(tokeniser: ITokeniser): Promise<number>;
 }

package/dist/training/tasks/PretrainingTask.js CHANGED Viewed

@@ -1,5 +1,5 @@
 import { Task as n } from "./Task.js";
-class i extends n {
+class r extends n {
   rawText;
   index = 0;
   get length() {
@@ -26,18 +26,8 @@ class i extends n {
     const e = t.encodeSequence(this.rawText[this.index]);
     return this.index++, e;
   }
-  getRandomConversation() {
-    const t = Math.floor(Math.random() * this.rawText.length);
-    return [
-      {
-        role: "assistant",
-        content: this.rawText[t]
-      }
-    ];
-  }
-  getRandomTokens(t) {
-    const e = Math.floor(Math.random() * this.rawText.length);
-    return t.encodeSequence(this.rawText[e]);
+  shuffle() {
+    this.index = 0;
   }
   async estimateTokens(t) {
     return (await t.encodeConversation([
@@ -49,5 +39,5 @@ class i extends n {
   }
 }
 export {
-  i as default
+  r as default
 };

package/dist/training/tasks/StartSentenceTask.d.ts CHANGED Viewed

@@ -8,8 +8,7 @@ export default class StartSentenceTask extends Task {
     hasMoreConversations(): boolean;
     nextConversation(): Conversation[] | null;
     nextTokens(tokeniser: ITokeniser): number[] | null;
-    getRandomConversation(): Conversation[];
-    getRandomTokens(tokeniser: ITokeniser): number[];
+    shuffle(): void;
     private conversationFromString;
     estimateTokens(tokeniser: ITokeniser): Promise<number>;
 }

package/dist/training/tasks/StartSentenceTask.js CHANGED Viewed

@@ -21,13 +21,8 @@ class a extends e {
     const n = this.nextConversation();
     return n ? t.encodeConversation(n) : null;
   }
-  getRandomConversation() {
-    const t = Math.floor(Math.random() * this.rawText.length);
-    return this.conversationFromString(this.rawText[t]);
-  }
-  getRandomTokens(t) {
-    const n = this.getRandomConversation();
-    return t.encodeConversation(n);
+  shuffle() {
+    this.index = 0;
   }
   conversationFromString(t) {
     const n = t.indexOf(".");

package/dist/training/tasks/Task.d.ts CHANGED Viewed

@@ -5,7 +5,6 @@ export declare abstract class Task {
     abstract nextConversation(): Conversation[] | null;
     abstract nextTokens(tokeniser: ITokeniser): number[] | null;
     abstract estimateTokens(tokeniser: ITokeniser): Promise<number>;
-    abstract getRandomConversation(): Conversation[];
-    abstract getRandomTokens(tokeniser: ITokeniser): number[];
+    abstract shuffle(): void;
 }
 export declare function tokensFromTasks(tasks: Task[], tokenizer: ITokeniser, cb?: (tokens: number) => void): Promise<Uint16Array>;

package/dist/training/tasks/splitter.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+import { Task } from './Task';
+export default function splitValidation(tasks: Task[], validationSplit: number): {
+    training: Task;
+    validation: Task;
+};

package/dist/training/tasks/splitter.js ADDED Viewed

@@ -0,0 +1,21 @@
+import s from "./ConversationTask.js";
+function f(e, o) {
+  if (o <= 0 || o >= 1)
+    throw new Error("validationSplit must be between 0 and 1");
+  e.forEach((n) => n.shuffle());
+  const r = [], a = [];
+  for (const n of e)
+    for (; n.hasMoreConversations(); ) {
+      const t = n.nextConversation();
+      if (!t)
+        break;
+      Math.random() < o ? a.push(t) : r.push(t);
+    }
+  return {
+    training: new s(r),
+    validation: new s(a)
+  };
+}
+export {
+  f as default
+};

package/dist/training/validation.js CHANGED Viewed

@@ -39,8 +39,8 @@ import "../ops/webgl/adamAdjust.js";
 import "../ops/cpu/adamMoments.js";
 import "../ops/webgl/adamMoments.js";
 import { PAGE_FACTOR as m, shuffle as h } from "./DatasetBuilder.js";
-import "../papaparse.min-C0cScC2i.js";
 import { tokensFromTasks as k } from "./tasks/Task.js";
+import "../papaparse.min-C0cScC2i.js";
 import "../ops/cpu/matMulGelu.js";
 import "../matMulGelu-JNLZqKQp.js";
 import "../ops/grads/matMulGelu.js";

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
     "name": "@genai-fi/nanogpt",
-    "version": "0.15.13",
+    "version": "0.16.1",
     "type": "module",
     "main": "dist/main.js",
     "types": "dist/main.d.ts",