npm - glost-core - Versions diffs - 0.5.0 - Mend

glost-core 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

package/CHANGELOG.md +63 -0
package/LICENSE +21 -0
package/README.md +199 -0
package/dist/__benchmarks__/document-creation.bench.d.ts +7 -0
package/dist/__benchmarks__/document-creation.bench.d.ts.map +1 -0
package/dist/__benchmarks__/document-creation.bench.js +71 -0
package/dist/__benchmarks__/document-creation.bench.js.map +1 -0
package/dist/__benchmarks__/traversal.bench.d.ts +7 -0
package/dist/__benchmarks__/traversal.bench.d.ts.map +1 -0
package/dist/__benchmarks__/traversal.bench.js +124 -0
package/dist/__benchmarks__/traversal.bench.js.map +1 -0
package/dist/cli/migrate.d.ts +8 -0
package/dist/cli/migrate.d.ts.map +1 -0
package/dist/cli/migrate.js +229 -0
package/dist/cli/migrate.js.map +1 -0
package/dist/errors.d.ts +168 -0
package/dist/errors.d.ts.map +1 -0
package/dist/errors.js +300 -0
package/dist/errors.js.map +1 -0
package/dist/guards.d.ts +103 -0
package/dist/guards.d.ts.map +1 -0
package/dist/guards.js +264 -0
package/dist/guards.js.map +1 -0
package/dist/index.d.ts +9 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +25 -0
package/dist/index.js.map +1 -0
package/dist/nodes.d.ts +227 -0
package/dist/nodes.d.ts.map +1 -0
package/dist/nodes.js +243 -0
package/dist/nodes.js.map +1 -0
package/dist/types.d.ts +442 -0
package/dist/types.d.ts.map +1 -0
package/dist/types.js +51 -0
package/dist/types.js.map +1 -0
package/dist/utils.d.ts +247 -0
package/dist/utils.d.ts.map +1 -0
package/dist/utils.js +564 -0
package/dist/utils.js.map +1 -0
package/dist/validators.d.ts +1876 -0
package/dist/validators.d.ts.map +1 -0
package/dist/validators.js +302 -0
package/dist/validators.js.map +1 -0
package/package.json +73 -0
package/src/__benchmarks__/document-creation.bench.ts +92 -0
package/src/__benchmarks__/traversal.bench.ts +152 -0
package/src/__tests__/README.md +20 -0
package/src/__tests__/example.test.ts +43 -0
package/src/__tests__/example.ts +186 -0
package/src/__tests__/helpers.test.ts +178 -0
package/src/__tests__/mock-data.ts +624 -0
package/src/__tests__/performance.test.ts +317 -0
package/src/__tests__/traversal.test.ts +170 -0
package/src/cli/migrate.ts +294 -0
package/src/errors.ts +394 -0
package/src/guards.ts +341 -0
package/src/index.ts +69 -0
package/src/nodes.ts +409 -0
package/src/types.ts +633 -0
package/src/utils.ts +730 -0
package/src/validators.ts +336 -0
package/tsconfig.json +9 -0

package/src/__tests__/performance.test.ts ADDED Viewed

@@ -0,0 +1,317 @@
+/**
+ * Performance Regression Tests
+ *
+ * Guards against performance regressions by setting baseline
+ * performance expectations for common operations.
+ *
+ * These tests should be run regularly to ensure performance
+ * improvements are maintained and no regressions are introduced.
+ */
+import { describe, it, expect } from 'vitest';
+import {
+  createSimpleDocument,
+  createGLOSTWordNode,
+  getAllWords,
+  getFirstWord,
+  getWordAtPath,
+  getAllSentences,
+  createSentenceFromWords,
+  createDocumentFromSentences,
+} from '../index.js';
+/**
+ * Test fixture: builds `wordCount` word nodes named `word0`, `word1`, ... and
+ * wraps them with `createSimpleDocument` (language "en", script "latin").
+ *
+ * @param wordCount - Number of word nodes to generate.
+ * @param withMetadata - When true, each word also gets an IPA transcription
+ *   and metadata (alternating "noun"/"verb" part of speech plus a meaning).
+ * @returns Whatever `createSimpleDocument` returns for the generated words.
+ */
+function createTestDocument(wordCount: number, withMetadata = false) {
+  // Builds the node for the word at position `index`.
+  const buildWord = (index: number) => {
+    const options: any = { value: `word${index}` };
+    if (!withMetadata) {
+      return createGLOSTWordNode(options);
+    }
+    options.transcription = {
+      ipa: { text: `wɜːrd${index}`, syllables: [`word${index}`] }
+    };
+    const isEvenIndex = index % 2 === 0;
+    options.metadata = {
+      partOfSpeech: isEvenIndex ? "noun" : "verb",
+      meaning: `meaning of word ${index}`,
+    };
+    return createGLOSTWordNode(options);
+  };
+  const nodes = Array.from({ length: wordCount }, (_unused, index) => buildWord(index));
+  return createSimpleDocument(nodes, "en", "latin");
+}
+/**
+ * Performance regression suite.
+ *
+ * Each test times one un-warmed run with `performance.now()` and compares the
+ * elapsed wall-clock milliseconds against a fixed budget, so results depend
+ * on the host machine and on JIT state.
+ */
+describe('Performance Regression Tests', () => {
+  // Floor for the denominator when comparing two timings, so a 0ms timer
+  // reading cannot turn a ratio into Infinity or NaN.
+  const MIN_MEASURABLE_MS = 0.01;
+  /**
+   * Runs `operation` once and reports its result together with the elapsed
+   * wall-clock time. Returning the result keeps the timed expression in use
+   * instead of leaving it as a discarded statement.
+   */
+  const measure = <T>(operation: () => T): { result: T; durationMs: number } => {
+    const start = performance.now();
+    const result = operation();
+    return { result, durationMs: performance.now() - start };
+  };
+  /** Builds `size` bare word nodes and wraps them in a simple document. */
+  const buildPlainDocument = (size: number) => {
+    const words = Array.from({ length: size }, (_, i) =>
+      createGLOSTWordNode({ value: `word${i}` })
+    );
+    return createSimpleDocument(words, "en", "latin");
+  };
+  /** Returns timings[i + 1] / timings[i] for every consecutive pair. */
+  const growthRatios = (timings: number[]): number[] =>
+    timings.slice(1).map((current, i) =>
+      current / Math.max(timings[i] ?? 0, MIN_MEASURABLE_MS)
+    );
+  describe('Document Creation Performance', () => {
+    it('should create 100-word document in under 10ms', () => {
+      const { durationMs } = measure(() => buildPlainDocument(100));
+      expect(durationMs).toBeLessThan(10);
+    });
+    it('should create 1000-word document in under 50ms', () => {
+      const { durationMs } = measure(() => buildPlainDocument(1000));
+      expect(durationMs).toBeLessThan(50);
+    });
+    it('should create word with full metadata in under 1ms', () => {
+      const { durationMs } = measure(() =>
+        createGLOSTWordNode({
+          value: "test",
+          transcription: {
+            ipa: { text: "test", syllables: ["test"] }
+          },
+          metadata: {
+            partOfSpeech: "noun",
+            meaning: "a test",
+            usage: "testing"
+          },
+          lang: "en",
+          script: "latin",
+          extras: {
+            translations: { th: "ทดสอบ" },
+            metadata: { frequency: "common" }
+          }
+        })
+      );
+      expect(durationMs).toBeLessThan(1);
+    });
+  });
+  describe('Document Traversal Performance', () => {
+    // Titles state the budget that is actually asserted; the 30ms and 150ms
+    // limits were relaxed from 20ms/100ms to tolerate slower machines.
+    it('should traverse 1000-word document in under 30ms', () => {
+      const doc = createTestDocument(1000);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(30); // Adjusted for various system capabilities
+    });
+    it('should traverse 5000-word document in under 150ms', () => {
+      const doc = createTestDocument(5000);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(150); // Adjusted for various system capabilities
+    });
+    it('should traverse 10000-word document in under 200ms', () => {
+      const doc = createTestDocument(10000);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(200);
+    }, 10000); // 10s timeout
+    it('should find first word in 10000-word document instantly', () => {
+      const doc = createTestDocument(10000);
+      const { durationMs } = measure(() => getFirstWord(doc));
+      // Should be very fast with SKIP optimization
+      expect(durationMs).toBeLessThan(200); // Generous limit accounting for variance
+    });
+    it('should access word by path in constant time', () => {
+      const doc = createTestDocument(5000);
+      const { durationMs } = measure(() =>
+        getWordAtPath(doc, { paragraph: 0, sentence: 0, word: 2500 })
+      );
+      // Only an absolute budget is checked here; constant-time behaviour
+      // itself is not verified by this assertion.
+      expect(durationMs).toBeLessThan(5);
+    });
+  });
+  describe('Complex Operations Performance', () => {
+    it('should filter 5000 words by POS in under 50ms', () => {
+      const doc = createTestDocument(5000, true);
+      const words = getAllWords(doc);
+      const { durationMs } = measure(() =>
+        words.filter(w => w.metadata?.partOfSpeech === "noun")
+      );
+      expect(durationMs).toBeLessThan(50);
+    });
+    it('should map 5000 words to text in under 30ms', () => {
+      const doc = createTestDocument(5000);
+      const words = getAllWords(doc);
+      const { durationMs } = measure(() => words.map(w => w.children[0]?.value));
+      expect(durationMs).toBeLessThan(30);
+    });
+    it('should count words with transcription in under 30ms', () => {
+      const doc = createTestDocument(5000, true);
+      const words = getAllWords(doc);
+      const { durationMs } = measure(() =>
+        words.filter(w => w.transcription !== undefined).length
+      );
+      expect(durationMs).toBeLessThan(30);
+    });
+  });
+  describe('Document Structure Performance', () => {
+    it('should create document from 100 sentences in under 50ms', () => {
+      // Sentence construction is setup and is deliberately left untimed.
+      const sentences = Array.from({ length: 100 }, (_, i) => {
+        const words = Array.from({ length: 5 }, (_, j) =>
+          createGLOSTWordNode({ value: `word${i}-${j}` })
+        );
+        return createSentenceFromWords(words, "en", "latin", `Sentence ${i}`);
+      });
+      const { durationMs } = measure(() =>
+        createDocumentFromSentences(sentences, "en", "latin")
+      );
+      expect(durationMs).toBeLessThan(50);
+    });
+    it('should get all sentences from 1000-word document in under 30ms', () => {
+      const doc = createTestDocument(1000);
+      const { durationMs } = measure(() => getAllSentences(doc));
+      expect(durationMs).toBeLessThan(30);
+    });
+  });
+  describe('Memory Efficiency', () => {
+    // NOTE: these tests measure elapsed time only; average time per iteration
+    // is used as an indirect signal and no memory usage is inspected.
+    it('should handle repeated document creation without memory buildup', () => {
+      const iterations = 100;
+      const { durationMs } = measure(() => {
+        for (let i = 0; i < iterations; i++) {
+          buildPlainDocument(100);
+        }
+      });
+      // Average should be reasonable
+      expect(durationMs / iterations).toBeLessThan(10);
+    });
+    it('should handle repeated traversal without performance degradation', () => {
+      const doc = createTestDocument(1000);
+      const iterations = 100;
+      const { durationMs } = measure(() => {
+        for (let i = 0; i < iterations; i++) {
+          getAllWords(doc);
+        }
+      });
+      expect(durationMs / iterations).toBeLessThan(20);
+    });
+  });
+  describe('Scaling Characteristics', () => {
+    it('should demonstrate linear scaling for document creation', () => {
+      const sizes = [100, 500, 1000];
+      const timings = sizes.map((size) =>
+        measure(() => buildPlainDocument(size)).durationMs
+      );
+      // ratio1 compares 500 vs 100 words, ratio2 compares 1000 vs 500 words.
+      const [ratio1, ratio2] = growthRatios(timings);
+      // Should scale reasonably (not exponential)
+      // Allow for variance in performance measurement
+      expect(ratio1).toBeLessThan(20); // Relaxed constraint
+      expect(ratio2).toBeLessThan(10);
+    });
+    it('should demonstrate linear scaling for traversal', () => {
+      const sizes = [1000, 5000, 10000];
+      const timings = sizes.map((size) => {
+        // Document construction is setup; only the traversal is timed.
+        const doc = createTestDocument(size);
+        return measure(() => getAllWords(doc)).durationMs;
+      });
+      // ratio1 compares 5000 vs 1000 words, ratio2 compares 10000 vs 5000 words.
+      const [ratio1, ratio2] = growthRatios(timings);
+      // Should scale linearly (5x and 2x)
+      expect(ratio1).toBeLessThan(10);
+      expect(ratio2).toBeLessThan(5);
+    });
+  });
+  describe('Baseline Performance Targets', () => {
+    it('meets target: small docs (10-50 words) < 10ms', () => {
+      const doc = createTestDocument(50, true);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(10);
+    });
+    it('meets target: medium docs (100-500 words) < 50ms', () => {
+      const doc = createTestDocument(500, true);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(50);
+    });
+    it('meets target: large docs (1000+ words) < 200ms', () => {
+      const doc = createTestDocument(1000, true);
+      const { durationMs } = measure(() => getAllWords(doc));
+      expect(durationMs).toBeLessThan(200);
+    });
+  });
+});

package/src/__tests__/traversal.test.ts ADDED Viewed

@@ -0,0 +1,170 @@
+/**
+ * Tests for traversal helper functions
+ */
+import { describe, it, expect } from "vitest";
+import {
+  createSimpleDocument,
+  createGLOSTWordNode,
+  getAllWords,
+  getFirstWord,
+  getWordAtPath,
+  getWordText,
+  createSentenceFromWords,
+  createDocumentFromSentences,
+} from "../index.js";
+/**
+ * Unit tests for the traversal helpers `getFirstWord`, `getWordAtPath` and
+ * `getAllWords`, exercised on small English ("en" / "latin") documents.
+ */
+describe("Traversal Helper Functions", () => {
+  /** Creates an "en"/"latin" word node whose value is `value`. */
+  const englishWord = (value: string) =>
+    createGLOSTWordNode({ value, lang: "en", script: "latin" });
+  /** Builds a document with `createSimpleDocument` from the given word texts. */
+  const documentOf = (...values: string[]) =>
+    createSimpleDocument(values.map((value) => englishWord(value)), "en", "latin");
+  /** Builds a document from two one-word sentences: "first", then "second". */
+  const twoSentenceDocument = () => {
+    // Both words are created before either sentence, as in a hand-written setup.
+    const sentences = ["first", "second"]
+      .map((value) => englishWord(value))
+      .map((word) => createSentenceFromWords([word], "en", "latin"));
+    return createDocumentFromSentences(sentences, "en", "latin");
+  };
+  describe("getFirstWord", () => {
+    it("should return first word from document", () => {
+      const firstWord = getFirstWord(documentOf("first", "second", "third"));
+      expect(firstWord).toBeDefined();
+      expect(getWordText(firstWord!)).toBe("first");
+    });
+    it("should return undefined for empty document", () => {
+      const firstWord = getFirstWord(documentOf());
+      expect(firstWord).toBeUndefined();
+    });
+    it("should return first word even with multiple sentences", () => {
+      const firstWord = getFirstWord(twoSentenceDocument());
+      expect(firstWord).toBeDefined();
+      expect(getWordText(firstWord!)).toBe("first");
+    });
+  });
+  describe("getWordAtPath", () => {
+    it("should get word at valid path", () => {
+      const expectedTexts = ["one", "two", "three"];
+      const doc = documentOf(...expectedTexts);
+      // Word i of paragraph 0, sentence 0 must carry the i-th text.
+      expectedTexts.forEach((text, index) => {
+        const found = getWordAtPath(doc, { paragraph: 0, sentence: 0, word: index });
+        expect(found).toBeDefined();
+        expect(getWordText(found!)).toBe(text);
+      });
+    });
+    // One out-of-range path per level; each is looked up in a one-word document.
+    const outOfRangePaths = {
+      paragraph: { paragraph: 99, sentence: 0, word: 0 },
+      sentence: { paragraph: 0, sentence: 99, word: 0 },
+      word: { paragraph: 0, sentence: 0, word: 99 },
+    };
+    for (const [level, path] of Object.entries(outOfRangePaths)) {
+      it(`should return undefined for invalid ${level} index`, () => {
+        const doc = documentOf("test");
+        expect(getWordAtPath(doc, path)).toBeUndefined();
+      });
+    }
+    it("should handle multi-sentence documents", () => {
+      const doc = twoSentenceDocument();
+      // Word 0 of sentence 0, then word 0 of sentence 1.
+      const fromFirstSentence = getWordAtPath(doc, { paragraph: 0, sentence: 0, word: 0 });
+      expect(getWordText(fromFirstSentence!)).toBe("first");
+      const fromSecondSentence = getWordAtPath(doc, { paragraph: 0, sentence: 1, word: 0 });
+      expect(getWordText(fromSecondSentence!)).toBe("second");
+    });
+  });
+  describe("Helper integration", () => {
+    it("getFirstWord should match first result from getAllWords", () => {
+      const doc = documentOf("alpha", "beta", "gamma");
+      const firstWord = getFirstWord(doc);
+      const allWords = getAllWords(doc);
+      // Same node instance, not merely equal text.
+      expect(firstWord).toBe(allWords[0]);
+      expect(getWordText(firstWord!)).toBe(getWordText(allWords[0]));
+    });
+    it("getWordAtPath should match getAllWords result by index", () => {
+      const doc = documentOf("one", "two", "three");
+      const allWords = getAllWords(doc);
+      const secondByPath = getWordAtPath(doc, { paragraph: 0, sentence: 0, word: 1 });
+      expect(secondByPath).toBe(allWords[1]);
+      expect(getWordText(secondByPath!)).toBe("two");
+    });
+  });
+});