npm - @storyteller-platform/align - Versions diffs - 0.1.9 → 0.1.11 - Mend

@storyteller-platform/align 0.1.9 → 0.1.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113) hide show

package/dist/align/__tests__/align.test.cjs +6 -5
package/dist/align/__tests__/align.test.js +6 -5
package/dist/align/align.cjs +133 -81
package/dist/align/align.d.cts +1 -0
package/dist/align/align.d.ts +1 -0
package/dist/align/align.js +133 -81
package/dist/align/getSentenceRanges.cjs +78 -149
package/dist/align/getSentenceRanges.d.cts +1 -1
package/dist/align/getSentenceRanges.d.ts +1 -1
package/dist/align/getSentenceRanges.js +78 -149
package/dist/align/slugify.cjs +16 -8
package/dist/align/slugify.js +16 -8
package/dist/errorAlign/__tests__/errorAlign.test.cjs +100 -0
package/dist/errorAlign/__tests__/errorAlign.test.d.cts +2 -0
package/dist/errorAlign/__tests__/errorAlign.test.d.ts +2 -0
package/dist/errorAlign/__tests__/errorAlign.test.js +77 -0
package/dist/errorAlign/__tests__/native.test.cjs +118 -0
package/dist/errorAlign/__tests__/native.test.d.cts +2 -0
package/dist/errorAlign/__tests__/native.test.d.ts +2 -0
package/dist/errorAlign/__tests__/native.test.js +107 -0
package/dist/errorAlign/backtraceGraph.cjs +298 -0
package/dist/errorAlign/backtraceGraph.d.cts +103 -0
package/dist/errorAlign/backtraceGraph.d.ts +103 -0
package/dist/errorAlign/backtraceGraph.js +270 -0
package/dist/errorAlign/beamSearch.cjs +302 -0
package/dist/errorAlign/beamSearch.d.cts +53 -0
package/dist/errorAlign/beamSearch.d.ts +53 -0
package/dist/errorAlign/beamSearch.js +268 -0
package/dist/errorAlign/core.cjs +33 -0
package/dist/errorAlign/core.d.cts +5 -0
package/dist/errorAlign/core.d.ts +5 -0
package/dist/errorAlign/core.js +11 -0
package/dist/errorAlign/editDistance.cjs +115 -0
package/dist/errorAlign/editDistance.d.cts +46 -0
package/dist/errorAlign/editDistance.d.ts +46 -0
package/dist/errorAlign/editDistance.js +90 -0
package/dist/errorAlign/errorAlign.cjs +159 -0
package/dist/errorAlign/errorAlign.d.cts +15 -0
package/dist/errorAlign/errorAlign.d.ts +15 -0
package/dist/errorAlign/errorAlign.js +145 -0
package/dist/errorAlign/graphMetadata.cjs +97 -0
package/dist/errorAlign/graphMetadata.d.cts +44 -0
package/dist/errorAlign/graphMetadata.d.ts +44 -0
package/dist/errorAlign/graphMetadata.js +64 -0
package/dist/errorAlign/hash.cjs +173 -0
package/dist/errorAlign/hash.d.cts +28 -0
package/dist/errorAlign/hash.d.ts +28 -0
package/dist/errorAlign/hash.js +150 -0
package/dist/errorAlign/native.cjs +60 -0
package/dist/errorAlign/native.d.cts +18 -0
package/dist/errorAlign/native.d.ts +18 -0
package/dist/errorAlign/native.js +24 -0
package/dist/errorAlign/node-gyp-build.d.cjs +1 -0
package/dist/errorAlign/node-gyp-build.d.d.cts +3 -0
package/dist/errorAlign/node-gyp-build.d.d.ts +3 -0
package/dist/errorAlign/node-gyp-build.d.js +0 -0
package/dist/errorAlign/pathToAlignment.cjs +122 -0
package/dist/errorAlign/pathToAlignment.d.cts +11 -0
package/dist/errorAlign/pathToAlignment.d.ts +11 -0
package/dist/errorAlign/pathToAlignment.js +89 -0
package/dist/errorAlign/utils.cjs +301 -0
package/dist/errorAlign/utils.d.cts +107 -0
package/dist/errorAlign/utils.d.ts +107 -0
package/dist/errorAlign/utils.js +248 -0
package/dist/index.d.cts +1 -0
package/dist/index.d.ts +1 -0
package/dist/markup/__tests__/markup.test.cjs +108 -81
package/dist/markup/__tests__/markup.test.js +109 -82
package/dist/markup/__tests__/parseDom.test.cjs +112 -0
package/dist/markup/__tests__/parseDom.test.d.cts +2 -0
package/dist/markup/__tests__/parseDom.test.d.ts +2 -0
package/dist/markup/__tests__/parseDom.test.js +89 -0
package/dist/markup/__tests__/serializeDom.test.cjs +120 -0
package/dist/markup/__tests__/serializeDom.test.d.cts +2 -0
package/dist/markup/__tests__/serializeDom.test.d.ts +2 -0
package/dist/markup/__tests__/serializeDom.test.js +97 -0
package/dist/markup/__tests__/transform.test.cjs +122 -0
package/dist/markup/__tests__/transform.test.d.cts +2 -0
package/dist/markup/__tests__/transform.test.d.ts +2 -0
package/dist/markup/__tests__/transform.test.js +99 -0
package/dist/markup/map.cjs +261 -0
package/dist/markup/map.d.cts +50 -0
package/dist/markup/map.d.ts +50 -0
package/dist/markup/map.js +236 -0
package/dist/markup/markup.cjs +23 -201
package/dist/markup/markup.d.cts +5 -9
package/dist/markup/markup.d.ts +5 -9
package/dist/markup/markup.js +24 -203
package/dist/markup/model.cjs +172 -0
package/dist/markup/model.d.cts +57 -0
package/dist/markup/model.d.ts +57 -0
package/dist/markup/model.js +145 -0
package/dist/markup/parseDom.cjs +59 -0
package/dist/markup/parseDom.d.cts +7 -0
package/dist/markup/parseDom.d.ts +7 -0
package/dist/markup/parseDom.js +35 -0
package/dist/markup/segmentation.cjs +11 -57
package/dist/markup/segmentation.d.cts +6 -2
package/dist/markup/segmentation.d.ts +6 -2
package/dist/markup/segmentation.js +11 -58
package/dist/markup/serializeDom.cjs +87 -0
package/dist/markup/serializeDom.d.cts +7 -0
package/dist/markup/serializeDom.d.ts +7 -0
package/dist/markup/serializeDom.js +63 -0
package/dist/markup/transform.cjs +92 -0
package/dist/markup/transform.d.cts +11 -0
package/dist/markup/transform.d.ts +11 -0
package/dist/markup/transform.js +71 -0
package/dist/types/node-gyp-build.d.cjs +1 -0
package/dist/types/node-gyp-build.d.d.cts +3 -0
package/dist/types/node-gyp-build.d.d.ts +3 -0
package/dist/types/node-gyp-build.d.js +0 -0
package/package.json +11 -4

package/dist/align/__tests__/align.test.cjs CHANGED Viewed

@@ -131,13 +131,13 @@ async function assertAlignSnapshot(context, epub, transcriptionFilepaths) {
       "utf-8"
     );
     const chapterXml = import_epub.Epub.xhtmlParser.parse(chapterContents);
-    const segmentation = await (0, import_segmentation.getXhtmlSegmentation)(
+    const { result: segmentation } = await (0, import_segmentation.getXhtmlSegmentation)(
       import_epub.Epub.getXhtmlBody(chapterXml),
       {
         primaryLocale: new Intl.Locale("en-US")
       }
     );
-    const chapterSentences = segmentation.sentences.map((s) => s.text);
+    const chapterSentences = segmentation.map((s) => s.text).filter((s) => s.match(/\S/));
     for (const par of import_epub.Epub.getXmlChildren(seq)) {
       newSnapshot += `
 `;
@@ -151,14 +151,14 @@ async function assertAlignSnapshot(context, epub, transcriptionFilepaths) {
       if (sentenceId === void 0) continue;
       const textSentence = chapterSentences[parseInt(sentenceId)];
       if (!textSentence) continue;
-      newSnapshot += `Text:  ${textSentence}
+      newSnapshot += `Text:  ${textSentence.replace(/\n/, "")}
 `;
       const audioSrc = (_d = audio[":@"]) == null ? void 0 : _d["@_src"];
       if (!audioSrc) continue;
       const audioStart = (_e = audio[":@"]) == null ? void 0 : _e["@_clipBegin"];
       const audioEnd = (_f = audio[":@"]) == null ? void 0 : _f["@_clipEnd"];
       if (!audioStart || !audioEnd) continue;
-      const audioStartTime = parseFloat(audioStart.slice(0, -1));
+      const audioStartTime = parseFloat(audioStart.slice(0, -1)) - 2e-3;
       const audioEndTime = parseFloat(audioEnd.slice(0, -1));
       const audioFilename = (0, import_posix.basename)(audioSrc, (0, import_node_path.extname)(audioSrc));
       const transcriptionFilepath = transcriptionFilepaths.find(
@@ -271,7 +271,8 @@ void (0, import_node_test.describe)("align", () => {
         void 0,
         createTestLogger()
       );
-      await aligner.alignBook();
+      const timing = await aligner.alignBook();
+      if (!process.env["CI"]) timing.print();
       await assertAlignSnapshot(context, epub, transcriptionFilepaths);
     } catch (_) {
       var _error = _, _hasError = true;

package/dist/align/__tests__/align.test.js CHANGED Viewed

@@ -67,13 +67,13 @@ async function assertAlignSnapshot(context, epub, transcriptionFilepaths) {
       "utf-8"
     );
     const chapterXml = Epub.xhtmlParser.parse(chapterContents);
-    const segmentation = await getXhtmlSegmentation(
+    const { result: segmentation } = await getXhtmlSegmentation(
       Epub.getXhtmlBody(chapterXml),
       {
         primaryLocale: new Intl.Locale("en-US")
       }
     );
-    const chapterSentences = segmentation.sentences.map((s) => s.text);
+    const chapterSentences = segmentation.map((s) => s.text).filter((s) => s.match(/\S/));
     for (const par of Epub.getXmlChildren(seq)) {
       newSnapshot += `
 `;
@@ -87,14 +87,14 @@ async function assertAlignSnapshot(context, epub, transcriptionFilepaths) {
       if (sentenceId === void 0) continue;
       const textSentence = chapterSentences[parseInt(sentenceId)];
       if (!textSentence) continue;
-      newSnapshot += `Text:  ${textSentence}
+      newSnapshot += `Text:  ${textSentence.replace(/\n/, "")}
 `;
       const audioSrc = (_d = audio[":@"]) == null ? void 0 : _d["@_src"];
       if (!audioSrc) continue;
       const audioStart = (_e = audio[":@"]) == null ? void 0 : _e["@_clipBegin"];
       const audioEnd = (_f = audio[":@"]) == null ? void 0 : _f["@_clipEnd"];
       if (!audioStart || !audioEnd) continue;
-      const audioStartTime = parseFloat(audioStart.slice(0, -1));
+      const audioStartTime = parseFloat(audioStart.slice(0, -1)) - 2e-3;
       const audioEndTime = parseFloat(audioEnd.slice(0, -1));
       const audioFilename = posixBasename(audioSrc, extname(audioSrc));
       const transcriptionFilepath = transcriptionFilepaths.find(
@@ -207,7 +207,8 @@ void describe("align", () => {
         void 0,
         createTestLogger()
       );
-      await aligner.alignBook();
+      const timing = await aligner.alignBook();
+      if (!process.env["CI"]) timing.print();
       await assertAlignSnapshot(context, epub, transcriptionFilepaths);
     } catch (_) {
       var _error = _, _hasError = true;

package/dist/align/align.cjs CHANGED Viewed

@@ -81,7 +81,9 @@ module.exports = __toCommonJS(align_exports);
 var import_promises = require("node:fs/promises");
 var import_node_path = require("node:path");
 var import_posix = require("node:path/posix");
+var import_itertools = require("itertools");
 var import_memoize = __toESM(require("memoize"), 1);
+var import_runes2 = require("runes2");
 var import_audiobook = require("@storyteller-platform/audiobook");
 var import_epub = require("@storyteller-platform/epub");
 var import_ghost_story = require("@storyteller-platform/ghost-story");
@@ -90,7 +92,6 @@ var import_segmentation = require("../markup/segmentation.cjs");
 var import_fuzzy = require("./fuzzy.cjs");
 var import_getSentenceRanges = require("./getSentenceRanges.cjs");
 var import_slugify = require("./slugify.cjs");
-const OFFSET_SEARCH_WINDOW_SIZE = 5e3;
 async function align(input, output, transcriptionsDir, audiobookDir, options) {
   var _stack = [];
   try {
@@ -141,6 +142,7 @@ async function align(input, output, transcriptionsDir, audiobookDir, options) {
 class Aligner {
   constructor(epub, audiofiles, transcriptions, granularity, languageOverride, logger) {
     this.epub = epub;
+    this.audiofiles = audiofiles;
     this.languageOverride = languageOverride;
     this.logger = logger;
     this.transcription = concatTranscriptions(transcriptions, audiofiles);
@@ -155,71 +157,92 @@ class Aligner {
   report = {
     chapters: []
   };
-  findBestOffset(epubSentences, transcriptionText, lastMatchOffset, mapping) {
-    let i = 0;
-    while (i < transcriptionText.length) {
-      let startSentence = 0;
-      const proposedStartIndex = (lastMatchOffset + i) % transcriptionText.length;
-      const proposedEndIndex = (proposedStartIndex + OFFSET_SEARCH_WINDOW_SIZE) % transcriptionText.length;
-      const wrapping = proposedEndIndex < proposedStartIndex;
-      let endIndex = wrapping ? transcriptionText.length : proposedEndIndex;
-      let startIndex = proposedStartIndex;
-      let startSeen = null;
-      let endSeen = null;
-      for (const aligned of this.alignedChapters) {
-        const alignedStart = mapping.map(aligned.startOffset, -1);
-        const alignedEnd = mapping.map(aligned.endOffset, -1);
-        if (startSeen !== null && endSeen === alignedStart) {
-          endSeen = alignedEnd;
-        } else {
-          startSeen = alignedStart;
-          endSeen = alignedEnd;
-        }
-        if (startIndex >= startSeen && startIndex < endSeen) {
-          startIndex = endSeen;
-        }
-        if (endIndex >= startSeen && endIndex <= endSeen) {
-          endIndex = startSeen;
+  findBestOffset(epubSentences, transcriptionText, lastMatchOffset, dir = 1) {
+    const reverse = dir < 0;
+    if (dir < 0) {
+      epubSentences = epubSentences.toReversed().map((s) => (0, import_runes2.runes)(s).toReversed().join(""));
+      transcriptionText = (0, import_runes2.runes)(transcriptionText).toReversed().join("");
+      lastMatchOffset = transcriptionText.length - lastMatchOffset;
+    }
+    const flatSliceIndices = [
+      0,
+      ...this.alignedChapters.toSorted(
+        (a, b) => reverse ? transcriptionText.length - a.endOffset - (transcriptionText.length - b.endOffset) : a.startOffset - b.startOffset
+      ).flatMap((aligned) => [
+        reverse ? transcriptionText.length - aligned.endOffset : aligned.startOffset,
+        reverse ? transcriptionText.length - aligned.startOffset : aligned.endOffset
+      ]),
+      transcriptionText.length
+    ];
+    const sliceIndices = [];
+    for (let i = 0; i < flatSliceIndices.length - 1; i += 2) {
+      sliceIndices.push([flatSliceIndices[i], flatSliceIndices[i + 1]]);
+    }
+    const allSlices = [];
+    let startSlice = 0;
+    for (const [i, [start, end]] of (0, import_itertools.enumerate)(sliceIndices)) {
+      if (lastMatchOffset >= start && lastMatchOffset < end) {
+        if (!reverse) {
+          startSlice = i + 1;
+          allSlices.push({
+            start,
+            text: transcriptionText.slice(start, lastMatchOffset)
+          });
         }
+        allSlices.push({
+          start: lastMatchOffset,
+          text: transcriptionText.slice(lastMatchOffset, end)
+        });
+      } else if (!reverse) {
+        allSlices.push({ start, text: transcriptionText.slice(start, end) });
+      }
+    }
+    const slices = allSlices.filter((slice) => slice.text.length);
+    if (reverse && !slices.length) {
+      const indices = sliceIndices.find(([start]) => start > lastMatchOffset);
+      if (indices) {
+        slices.push({
+          start: indices[0],
+          text: transcriptionText.slice(...indices)
+        });
       }
-      if (startIndex < endIndex) {
-        const transcriptionTextSlice = transcriptionText.slice(
-          startIndex,
-          endIndex
+    }
+    for (const slice of slices.slice(startSlice).concat(slices.slice(0, startSlice))) {
+      let startSentence = 0;
+      while (startSentence < epubSentences.length) {
+        const needle = epubSentences.slice(startSentence, startSentence + 6).join("-");
+        const firstMatch = (0, import_fuzzy.findNearestMatch)(
+          needle,
+          slice.text,
+          Math.max(Math.floor(0.1 * needle.length), 1)
         );
-        while (startSentence < epubSentences.length) {
-          const queryString = epubSentences.slice(startSentence, startSentence + 6).join("-");
-          const firstMatch = (0, import_fuzzy.findNearestMatch)(
-            queryString.toLowerCase(),
-            transcriptionTextSlice.toLowerCase(),
-            Math.max(Math.floor(0.1 * queryString.length), 1)
-          );
-          if (firstMatch) {
-            return {
-              startSentence,
-              transcriptionOffset: (firstMatch.index + startIndex) % transcriptionText.length
-            };
-          }
-          startSentence += 3;
+        if (firstMatch) {
+          const start = reverse ? transcriptionText.length - (slice.start + firstMatch.index) : slice.start + firstMatch.index;
+          return {
+            startSentence: reverse ? epubSentences.length - startSentence : startSentence,
+            transcriptionOffset: start
+          };
         }
+        startSentence += 3;
       }
-      if (wrapping) {
-        i += transcriptionText.length - proposedStartIndex;
-      } else {
-        i += Math.floor(OFFSET_SEARCH_WINDOW_SIZE / 2);
-      }
+    }
+    if (reverse) {
+      return {
+        startSentence: epubSentences.length,
+        transcriptionOffset: slices[0] ? transcriptionText.length - slices[0].start : null
+      };
     }
     return { startSentence: 0, transcriptionOffset: null };
   }
   async getChapterSentences(chapterId) {
     const chapterXml = await this.epub.readXhtmlItemContents(chapterId);
-    const segmentation = await (0, import_segmentation.getXhtmlSegmentation)(
+    const { result: segmentation } = await (0, import_segmentation.getXhtmlSegmentation)(
       import_epub.Epub.getXhtmlBody(chapterXml),
       {
         primaryLocale: this.languageOverride ?? await this.epub.getLanguage()
       }
     );
-    return segmentation.sentences.map((s) => s.text);
+    return segmentation.map((s) => s.text).filter((s) => s.match(/\S/));
   }
   async writeAlignedChapter(alignedChapter) {
     const { chapter, sentenceRanges, xml } = alignedChapter;
@@ -314,7 +337,7 @@ class Aligner {
       }, [])
     });
   }
-  async alignChapter(startSentence, chapterId, transcriptionOffset, locale, lastSentenceRange) {
+  async alignChapter(startSentence, endSentence, chapterId, transcriptionOffset, transcriptionEndOffset, locale, mapping) {
     const timing = (0, import_ghost_story.createTiming)();
     timing.start("read contents");
     const manifest = await this.epub.getManifest();
@@ -331,20 +354,14 @@ class Aligner {
     timing.start("align sentences");
     const { sentenceRanges, transcriptionOffset: endTranscriptionOffset } = await (0, import_getSentenceRanges.getSentenceRanges)(
       startSentence,
+      endSentence,
       this.transcription,
       chapterSentences,
       transcriptionOffset,
-      locale,
-      lastSentenceRange
+      transcriptionEndOffset,
+      locale
     );
     timing.end("align sentences");
-    timing.start("expand ranges");
-    const interpolated = await (0, import_getSentenceRanges.interpolateSentenceRanges)(
-      sentenceRanges,
-      lastSentenceRange
-    );
-    const expanded = (0, import_getSentenceRanges.expandEmptySentenceRanges)(interpolated);
-    timing.end("expand ranges");
     const storytellerStylesheetUrl = (0, import_posix.relative)(
       (0, import_posix.dirname)(chapter.href),
       "Styles/storyteller-readaloud.css"
@@ -357,25 +374,25 @@ class Aligner {
     this.alignedChapters.push({
       chapter,
       xml: chapterXml,
-      sentenceRanges: expanded,
-      startOffset: transcriptionOffset,
-      endOffset: endTranscriptionOffset
+      sentenceRanges,
+      startOffset: mapping.map(transcriptionOffset),
+      endOffset: mapping.map(endTranscriptionOffset, -1)
     });
     this.addChapterReport(
       chapter,
       chapterSentences,
-      expanded,
+      sentenceRanges,
       startSentence,
       transcriptionOffset
     );
     return {
-      lastSentenceRange: expanded[expanded.length - 1] ?? null,
+      lastSentenceRange: sentenceRanges.at(-1) ?? null,
       endTranscriptionOffset,
       timing
     };
   }
   async alignBook(onProgress) {
-    var _a, _b, _c, _d, _e, _f, _g;
+    var _a, _b, _c, _d, _e, _f, _g, _h;
     const locale = this.languageOverride ?? await this.epub.getLanguage() ?? new Intl.Locale("en-US");
     this.timing.setMetadata("language", locale.toString());
     this.timing.setMetadata("granularity", this.granularity);
@@ -386,7 +403,6 @@ class Aligner {
       locale
     );
     let lastTranscriptionOffset = 0;
-    let lastSentenceRange = null;
     for (let index = 0; index < spine.length; index++) {
       onProgress == null ? void 0 : onProgress(index / spine.length);
       const spineItem = spine[index];
@@ -418,36 +434,72 @@ class Aligner {
       const { startSentence, transcriptionOffset: slugifiedOffset } = this.findBestOffset(
         slugifiedChapterSentences,
         transcriptionText,
-        mapping.map(lastTranscriptionOffset, -1),
-        mapping
+        mapping.map(lastTranscriptionOffset, -1)
       );
-      const transcriptionOffset = slugifiedOffset && mapping.invert().map(slugifiedOffset, -1);
-      if (transcriptionOffset === null) {
+      if (slugifiedOffset === null) {
         (_f = this.logger) == null ? void 0 : _f.info(
           `Couldn't find matching transcription for chapter #${index}`
         );
         continue;
       }
-      (_g = this.logger) == null ? void 0 : _g.info(
-        `Chapter #${index} best matches transcription at offset ${transcriptionOffset}, starting at sentence ${startSentence}`
+      const transcriptionOffset = mapping.invert().map(slugifiedOffset, -1);
+      const {
+        startSentence: startEndSentence,
+        transcriptionOffset: slugifiedEndOffset
+      } = this.findBestOffset(
+        slugifiedChapterSentences,
+        transcriptionText,
+        Math.min(
+          transcriptionText.length,
+          slugifiedOffset + Math.round(slugifiedChapterSentences.join("-").length * 1.2)
+        ),
+        -1
+      );
+      const endSentence = startEndSentence;
+      const endOffset = slugifiedEndOffset === null ? this.transcription.transcript.length : mapping.invert().map(slugifiedEndOffset, 1);
+      if (endSentence - startSentence < slugifiedChapterSentences.length / 2) {
+        (_g = this.logger) == null ? void 0 : _g.info(`Found less than half of chapter #${index}, skipping`);
+      }
+      (_h = this.logger) == null ? void 0 : _h.info(
+        `Chapter #${index} best matches transcription from ${transcriptionOffset} to ${endOffset}, from sentence ${startSentence} to ${endSentence} (of ${slugifiedChapterSentences.length}) in the book`
       );
       const result = await this.alignChapter(
         startSentence,
+        endSentence,
         chapterId,
         transcriptionOffset,
+        endOffset,
         locale,
-        lastSentenceRange
+        mapping
       );
-      lastSentenceRange = result.lastSentenceRange;
       lastTranscriptionOffset = result.endTranscriptionOffset;
       this.timing.add(result.timing.summary());
     }
-    if (lastSentenceRange) {
-      lastSentenceRange.end = await (0, import_ffmpeg.getTrackDuration)(
-        lastSentenceRange.audiofile
+    const audioOrderedChapters = this.alignedChapters.toSorted((a, b) => {
+      const firstRangeA = a.sentenceRanges[0];
+      const firstRangeB = b.sentenceRanges[0];
+      if (!firstRangeA) return 1;
+      if (!firstRangeB) return -1;
+      const firstAudiofileIndexA = this.audiofiles.indexOf(
+        firstRangeA.audiofile
       );
-    }
-    for (const alignedChapter of this.alignedChapters) {
+      const firstAudiofileIndexB = this.audiofiles.indexOf(
+        firstRangeB.audiofile
+      );
+      if (firstAudiofileIndexA === firstAudiofileIndexB) {
+        return firstRangeA.start - firstRangeB.start;
+      }
+      return firstAudiofileIndexA - firstAudiofileIndexB;
+    });
+    let lastSentenceRange = null;
+    for (const alignedChapter of audioOrderedChapters) {
+      const interpolated = await (0, import_getSentenceRanges.interpolateSentenceRanges)(
+        alignedChapter.sentenceRanges,
+        lastSentenceRange
+      );
+      const expanded = (0, import_getSentenceRanges.expandEmptySentenceRanges)(interpolated);
+      alignedChapter.sentenceRanges = expanded;
+      lastSentenceRange = expanded.at(-1) ?? null;
       await this.writeAlignedChapter(alignedChapter);
     }
     await this.epub.addMetadata({

package/dist/align/align.d.cts CHANGED Viewed

@@ -37,6 +37,7 @@ interface AlignOptions {
 declare function align(input: string, output: string, transcriptionsDir: string, audiobookDir: string, options: AlignOptions): Promise<_storyteller_platform_ghost_story.TimingAggregator>;
 declare class Aligner {
     epub: Epub;
+    private audiofiles;
     private languageOverride?;
     private logger?;
     private transcription;

package/dist/align/align.d.ts CHANGED Viewed

@@ -37,6 +37,7 @@ interface AlignOptions {
 declare function align(input: string, output: string, transcriptionsDir: string, audiobookDir: string, options: AlignOptions): Promise<_storyteller_platform_ghost_story.TimingAggregator>;
 declare class Aligner {
     epub: Epub;
+    private audiofiles;
     private languageOverride?;
     private logger?;
     private transcription;