@omnimedia/omnitool 1.1.0-1 → 1.1.0-10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (222) hide show
  1. package/README.md +1 -1
  2. package/package.json +12 -9
  3. package/s/context.ts +1 -1
  4. package/s/demo/demo.bundle.ts +6 -2
  5. package/s/demo/demo.css +5 -0
  6. package/s/demo/routines/filmstrip-test.ts +2 -2
  7. package/s/demo/routines/transcode-test.ts +4 -2
  8. package/s/demo/routines/transcriber-test.ts +34 -0
  9. package/s/demo/routines/transitions-test.ts +43 -0
  10. package/s/driver/driver.ts +17 -9
  11. package/s/driver/fns/host.ts +7 -6
  12. package/s/driver/fns/schematic.ts +45 -22
  13. package/s/driver/fns/work.ts +163 -151
  14. package/s/driver/utils/load-decoder-source.ts +3 -4
  15. package/s/features/speech/transcribe/default-spec.ts +11 -0
  16. package/s/features/speech/transcribe/parts/load-pipe.ts +19 -0
  17. package/s/features/speech/transcribe/parts/prep-audio.ts +23 -0
  18. package/s/features/speech/transcribe/parts/transcribe.ts +70 -0
  19. package/s/features/speech/transcribe/transcriber.ts +46 -0
  20. package/s/features/speech/transcribe/types.ts +82 -0
  21. package/s/features/speech/transcribe/worker.bundle.ts +40 -0
  22. package/s/features/transition/parts/fragment.ts +24 -0
  23. package/s/features/transition/parts/types.ts +94 -0
  24. package/s/features/transition/parts/uniforms.ts +29 -0
  25. package/s/features/transition/parts/vertex.ts +31 -0
  26. package/s/features/transition/transition.ts +60 -0
  27. package/s/index.html.ts +6 -1
  28. package/s/timeline/index.ts +1 -0
  29. package/s/timeline/parts/basics.ts +1 -1
  30. package/s/timeline/parts/compositor/export.ts +77 -0
  31. package/s/timeline/parts/compositor/parts/html-tree.ts +37 -0
  32. package/s/timeline/parts/compositor/parts/schedulers.ts +85 -0
  33. package/s/timeline/parts/compositor/parts/tree-builder.ts +184 -0
  34. package/s/timeline/parts/compositor/parts/webcodecs-tree.ts +30 -0
  35. package/s/timeline/parts/compositor/playback.ts +81 -0
  36. package/s/timeline/parts/compositor/samplers/html.ts +115 -0
  37. package/s/timeline/parts/compositor/samplers/webcodecs.ts +60 -0
  38. package/s/timeline/parts/item.ts +38 -6
  39. package/s/timeline/parts/media.ts +21 -0
  40. package/s/timeline/parts/waveform.ts +1 -1
  41. package/s/timeline/sugar/builders.ts +102 -0
  42. package/s/timeline/sugar/o.ts +117 -27
  43. package/s/timeline/sugar/omni-test.ts +2 -2
  44. package/s/timeline/sugar/omni.ts +21 -11
  45. package/s/timeline/types.ts +29 -0
  46. package/s/timeline/utils/audio-stream.ts +15 -0
  47. package/s/timeline/utils/checksum.ts +2 -1
  48. package/s/timeline/utils/matrix.ts +33 -0
  49. package/s/timeline/utils/video-cursor.ts +40 -0
  50. package/s/tools/common/loader.ts +26 -0
  51. package/s/tools/common/transformer-pipeline.ts +26 -0
  52. package/s/tools/speech-recognition/common/model.ts +26 -0
  53. package/s/tools/speech-recognition/whisper/fns/host.ts +25 -0
  54. package/s/tools/speech-recognition/whisper/fns/schematic.ts +23 -0
  55. package/s/tools/speech-recognition/whisper/fns/work.ts +91 -0
  56. package/s/tools/speech-recognition/whisper/parts/types.ts +38 -0
  57. package/s/tools/speech-recognition/whisper/parts/worker.bundle.ts +7 -0
  58. package/s/tools/speech-recognition/whisper/tool.ts +70 -0
  59. package/x/context.js +1 -1
  60. package/x/context.js.map +1 -1
  61. package/x/demo/demo.bundle.js +6 -2
  62. package/x/demo/demo.bundle.js.map +1 -1
  63. package/x/demo/demo.bundle.min.js +39 -37
  64. package/x/demo/demo.bundle.min.js.map +4 -4
  65. package/x/demo/demo.css +5 -0
  66. package/x/demo/routines/filmstrip-test.d.ts +1 -1
  67. package/x/demo/routines/filmstrip-test.js +2 -2
  68. package/x/demo/routines/filmstrip-test.js.map +1 -1
  69. package/x/demo/routines/transcode-test.js +4 -2
  70. package/x/demo/routines/transcode-test.js.map +1 -1
  71. package/x/demo/routines/transcriber-test.d.ts +4 -0
  72. package/x/demo/routines/transcriber-test.js +33 -0
  73. package/x/demo/routines/transcriber-test.js.map +1 -0
  74. package/x/demo/routines/transitions-test.d.ts +5 -0
  75. package/x/demo/routines/transitions-test.js +35 -0
  76. package/x/demo/routines/transitions-test.js.map +1 -0
  77. package/x/driver/driver.d.ts +3 -5
  78. package/x/driver/driver.js +16 -9
  79. package/x/driver/driver.js.map +1 -1
  80. package/x/driver/driver.worker.bundle.min.js +2537 -148
  81. package/x/driver/driver.worker.bundle.min.js.map +4 -4
  82. package/x/driver/fns/host.d.ts +9 -2
  83. package/x/driver/fns/host.js +3 -3
  84. package/x/driver/fns/host.js.map +1 -1
  85. package/x/driver/fns/schematic.d.ts +39 -21
  86. package/x/driver/fns/work.d.ts +11 -4
  87. package/x/driver/fns/work.js +111 -102
  88. package/x/driver/fns/work.js.map +1 -1
  89. package/x/driver/utils/load-decoder-source.d.ts +2 -1
  90. package/x/driver/utils/load-decoder-source.js +2 -3
  91. package/x/driver/utils/load-decoder-source.js.map +1 -1
  92. package/x/features/speech/transcribe/default-spec.d.ts +2 -0
  93. package/x/features/speech/transcribe/default-spec.js +8 -0
  94. package/x/features/speech/transcribe/default-spec.js.map +1 -0
  95. package/x/features/speech/transcribe/parts/load-pipe.d.ts +2 -0
  96. package/x/features/speech/transcribe/parts/load-pipe.js +13 -0
  97. package/x/features/speech/transcribe/parts/load-pipe.js.map +1 -0
  98. package/x/features/speech/transcribe/parts/prep-audio.d.ts +5 -0
  99. package/x/features/speech/transcribe/parts/prep-audio.js +21 -0
  100. package/x/features/speech/transcribe/parts/prep-audio.js.map +1 -0
  101. package/x/features/speech/transcribe/parts/transcribe.d.ts +5 -0
  102. package/x/features/speech/transcribe/parts/transcribe.js +56 -0
  103. package/x/features/speech/transcribe/parts/transcribe.js.map +1 -0
  104. package/x/features/speech/transcribe/transcriber.d.ts +5 -0
  105. package/x/features/speech/transcribe/transcriber.js +33 -0
  106. package/x/features/speech/transcribe/transcriber.js.map +1 -0
  107. package/x/features/speech/transcribe/types.d.ts +66 -0
  108. package/x/features/speech/transcribe/types.js +2 -0
  109. package/x/features/speech/transcribe/types.js.map +1 -0
  110. package/x/features/speech/transcribe/worker.bundle.d.ts +1 -0
  111. package/x/features/speech/transcribe/worker.bundle.js +33 -0
  112. package/x/features/speech/transcribe/worker.bundle.js.map +1 -0
  113. package/x/features/speech/transcribe/worker.bundle.min.js +2916 -0
  114. package/x/features/speech/transcribe/worker.bundle.min.js.map +7 -0
  115. package/x/features/transition/parts/fragment.d.ts +1 -0
  116. package/x/features/transition/parts/fragment.js +25 -0
  117. package/x/features/transition/parts/fragment.js.map +1 -0
  118. package/x/features/transition/parts/types.d.ts +23 -0
  119. package/x/features/transition/parts/types.js +2 -0
  120. package/x/features/transition/parts/types.js.map +1 -0
  121. package/x/features/transition/parts/uniforms.d.ts +31 -0
  122. package/x/features/transition/parts/uniforms.js +27 -0
  123. package/x/features/transition/parts/uniforms.js.map +1 -0
  124. package/x/features/transition/parts/vertex.d.ts +1 -0
  125. package/x/features/transition/parts/vertex.js +32 -0
  126. package/x/features/transition/parts/vertex.js.map +1 -0
  127. package/x/features/transition/transition.d.ts +5 -0
  128. package/x/features/transition/transition.js +50 -0
  129. package/x/features/transition/transition.js.map +1 -0
  130. package/x/index.html +13 -3
  131. package/x/index.html.js +6 -1
  132. package/x/index.html.js.map +1 -1
  133. package/x/timeline/index.d.ts +1 -0
  134. package/x/timeline/index.js +1 -0
  135. package/x/timeline/index.js.map +1 -1
  136. package/x/timeline/parts/basics.d.ts +1 -1
  137. package/x/timeline/parts/compositor/export.d.ts +9 -0
  138. package/x/timeline/parts/compositor/export.js +64 -0
  139. package/x/timeline/parts/compositor/export.js.map +1 -0
  140. package/x/timeline/parts/compositor/parts/html-tree.d.ts +3 -0
  141. package/x/timeline/parts/compositor/parts/html-tree.js +40 -0
  142. package/x/timeline/parts/compositor/parts/html-tree.js.map +1 -0
  143. package/x/timeline/parts/compositor/parts/schedulers.d.ts +15 -0
  144. package/x/timeline/parts/compositor/parts/schedulers.js +64 -0
  145. package/x/timeline/parts/compositor/parts/schedulers.js.map +1 -0
  146. package/x/timeline/parts/compositor/parts/tree-builder.d.ts +37 -0
  147. package/x/timeline/parts/compositor/parts/tree-builder.js +147 -0
  148. package/x/timeline/parts/compositor/parts/tree-builder.js.map +1 -0
  149. package/x/timeline/parts/compositor/parts/webcodecs-tree.d.ts +3 -0
  150. package/x/timeline/parts/compositor/parts/webcodecs-tree.js +28 -0
  151. package/x/timeline/parts/compositor/parts/webcodecs-tree.js.map +1 -0
  152. package/x/timeline/parts/compositor/playback.d.ts +19 -0
  153. package/x/timeline/parts/compositor/playback.js +71 -0
  154. package/x/timeline/parts/compositor/playback.js.map +1 -0
  155. package/x/timeline/parts/compositor/samplers/html.d.ts +3 -0
  156. package/x/timeline/parts/compositor/samplers/html.js +106 -0
  157. package/x/timeline/parts/compositor/samplers/html.js.map +1 -0
  158. package/x/timeline/parts/compositor/samplers/webcodecs.d.ts +2 -0
  159. package/x/timeline/parts/compositor/samplers/webcodecs.js +55 -0
  160. package/x/timeline/parts/compositor/samplers/webcodecs.js.map +1 -0
  161. package/x/timeline/parts/item.d.ts +34 -8
  162. package/x/timeline/parts/item.js +6 -3
  163. package/x/timeline/parts/item.js.map +1 -1
  164. package/x/timeline/parts/media.d.ts +3 -0
  165. package/x/timeline/parts/media.js +17 -0
  166. package/x/timeline/parts/media.js.map +1 -1
  167. package/x/timeline/parts/waveform.js +1 -1
  168. package/x/timeline/parts/waveform.js.map +1 -1
  169. package/x/timeline/sugar/builders.d.ts +1 -0
  170. package/x/timeline/sugar/builders.js +104 -0
  171. package/x/timeline/sugar/builders.js.map +1 -0
  172. package/x/timeline/sugar/o.d.ts +23 -5
  173. package/x/timeline/sugar/o.js +93 -27
  174. package/x/timeline/sugar/o.js.map +1 -1
  175. package/x/timeline/sugar/omni-test.js +1 -1
  176. package/x/timeline/sugar/omni-test.js.map +1 -1
  177. package/x/timeline/sugar/omni.d.ts +5 -2
  178. package/x/timeline/sugar/omni.js +17 -9
  179. package/x/timeline/sugar/omni.js.map +1 -1
  180. package/x/timeline/types.d.ts +24 -0
  181. package/x/timeline/types.js +2 -0
  182. package/x/timeline/types.js.map +1 -0
  183. package/x/timeline/utils/audio-stream.d.ts +6 -0
  184. package/x/timeline/utils/audio-stream.js +17 -0
  185. package/x/timeline/utils/audio-stream.js.map +1 -0
  186. package/x/timeline/utils/checksum.js +2 -1
  187. package/x/timeline/utils/checksum.js.map +1 -1
  188. package/x/timeline/utils/matrix.d.ts +8 -0
  189. package/x/timeline/utils/matrix.js +26 -0
  190. package/x/timeline/utils/matrix.js.map +1 -0
  191. package/x/timeline/utils/video-cursor.d.ts +10 -0
  192. package/x/timeline/utils/video-cursor.js +36 -0
  193. package/x/timeline/utils/video-cursor.js.map +1 -0
  194. package/x/tools/common/loader.d.ts +19 -0
  195. package/x/tools/common/loader.js +18 -0
  196. package/x/tools/common/loader.js.map +1 -0
  197. package/x/tools/common/transformer-pipeline.d.ts +8 -0
  198. package/x/tools/common/transformer-pipeline.js +24 -0
  199. package/x/tools/common/transformer-pipeline.js.map +1 -0
  200. package/x/tools/speech-recognition/common/model.d.ts +14 -0
  201. package/x/tools/speech-recognition/common/model.js +16 -0
  202. package/x/tools/speech-recognition/common/model.js.map +1 -0
  203. package/x/tools/speech-recognition/whisper/fns/host.d.ts +13 -0
  204. package/x/tools/speech-recognition/whisper/fns/host.js +19 -0
  205. package/x/tools/speech-recognition/whisper/fns/host.js.map +1 -0
  206. package/x/tools/speech-recognition/whisper/fns/schematic.d.ts +19 -0
  207. package/x/tools/speech-recognition/whisper/fns/schematic.js +2 -0
  208. package/x/tools/speech-recognition/whisper/fns/schematic.js.map +1 -0
  209. package/x/tools/speech-recognition/whisper/fns/work.d.ts +12 -0
  210. package/x/tools/speech-recognition/whisper/fns/work.js +74 -0
  211. package/x/tools/speech-recognition/whisper/fns/work.js.map +1 -0
  212. package/x/tools/speech-recognition/whisper/parts/types.d.ts +31 -0
  213. package/x/tools/speech-recognition/whisper/parts/types.js +2 -0
  214. package/x/tools/speech-recognition/whisper/parts/types.js.map +1 -0
  215. package/x/tools/speech-recognition/whisper/parts/worker.bundle.d.ts +1 -0
  216. package/x/tools/speech-recognition/whisper/parts/worker.bundle.js +4 -0
  217. package/x/tools/speech-recognition/whisper/parts/worker.bundle.js.map +1 -0
  218. package/x/tools/speech-recognition/whisper/parts/worker.bundle.min.js +8 -0
  219. package/x/tools/speech-recognition/whisper/parts/worker.bundle.min.js.map +7 -0
  220. package/x/tools/speech-recognition/whisper/tool.d.ts +12 -0
  221. package/x/tools/speech-recognition/whisper/tool.js +63 -0
  222. package/x/tools/speech-recognition/whisper/tool.js.map +1 -0
@@ -0,0 +1,24 @@
1
+ //@ts-ignore
2
+ import { pipeline } from "https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.7.0/dist/transformers.min.js";
3
+ export class PipelineFactory {
4
+ task;
5
+ instance = null;
6
+ model = null;
7
+ constructor(task) {
8
+ this.task = task;
9
+ }
10
+ async createInstance(model, progressCallback) {
11
+ this.model = model;
12
+ return this.instance = await pipeline(this.task, this.model, {
13
+ dtype: {
14
+ encoder_model: this.model === "onnx-community/whisper-large-v3-turbo"
15
+ ? "fp16"
16
+ : "fp32",
17
+ decoder_model_merged: "q4",
18
+ },
19
+ device: "webgpu",
20
+ progress_callback: progressCallback,
21
+ });
22
+ }
23
+ }
24
+ //# sourceMappingURL=transformer-pipeline.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"transformer-pipeline.js","sourceRoot":"","sources":["../../../s/tools/common/transformer-pipeline.ts"],"names":[],"mappings":"AAAA,YAAY;AACZ,OAAO,EAAC,QAAQ,EAAC,MAAM,uFAAuF,CAAA;AAI9G,MAAM,OAAO,eAAe;IAIR;IAHnB,QAAQ,GAAQ,IAAI,CAAA;IACpB,KAAK,GAAkB,IAAI,CAAA;IAE3B,YAAmB,IAAY;QAAZ,SAAI,GAAJ,IAAI,CAAQ;IAAG,CAAC;IAEnC,KAAK,CAAC,cAAc,CAAC,KAAa,EAAE,gBAAmC;QACtE,IAAI,CAAC,KAAK,GAAG,KAAK,CAAA;QAClB,OAAO,IAAI,CAAC,QAAQ,GAAG,MAAM,QAAQ,CAAC,IAAI,CAAC,IAAI,EAAE,IAAI,CAAC,KAAK,EAAE;YAC5D,KAAK,EAAE;gBACN,aAAa,EACZ,IAAI,CAAC,KAAK,KAAK,uCAAuC;oBACrD,CAAC,CAAC,MAAM;oBACR,CAAC,CAAC,MAAM;gBACV,oBAAoB,EAAE,IAAI;aAC1B;YACD,MAAM,EAAE,QAAQ;YAChB,iBAAiB,EAAE,gBAAgB;SACnC,CAAC,CAAA;IACH,CAAC;CACD"}
@@ -0,0 +1,14 @@
1
+ import { Loader } from "../../common/loader.js";
2
+ import { DecoderSource } from "../../../driver/fns/schematic.js";
3
+ import { SpeechRecognizerModels, Word, WordGroup } from "../whisper/parts/types.js";
4
+ export declare abstract class SpeechRecognizer extends Loader {
5
+ multilingual: boolean;
6
+ static speechRecognizerEvents: {
7
+ onTranscriptionChunk: import("@e280/stz").Pub<Word[]>;
8
+ onTranscribeProgress: import("@e280/stz").Pub<[number]>;
9
+ };
10
+ abstract transcribe(input: DecoderSource): Promise<WordGroup>;
11
+ setMultilingual(value: boolean): void;
12
+ detectLanguage?(input: Blob | AudioBuffer): Promise<string>;
13
+ setModel(value: SpeechRecognizerModels): void;
14
+ }
@@ -0,0 +1,16 @@
1
+ import { pub } from "@e280/stz";
2
+ import { Loader } from "../../common/loader.js";
3
+ export class SpeechRecognizer extends Loader {
4
+ multilingual = true;
5
+ static speechRecognizerEvents = {
6
+ onTranscriptionChunk: pub(),
7
+ onTranscribeProgress: pub()
8
+ };
9
+ setMultilingual(value) {
10
+ this.multilingual = value;
11
+ }
12
+ setModel(value) {
13
+ this.model = value;
14
+ }
15
+ }
16
+ //# sourceMappingURL=model.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"model.js","sourceRoot":"","sources":["../../../../s/tools/speech-recognition/common/model.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,GAAG,EAAC,MAAM,WAAW,CAAA;AAE7B,OAAO,EAAC,MAAM,EAAC,MAAM,wBAAwB,CAAA;AAI7C,MAAM,OAAgB,gBAAiB,SAAQ,MAAM;IACpD,YAAY,GAAG,IAAI,CAAA;IAEnB,MAAM,CAAC,sBAAsB,GAAG;QAC/B,oBAAoB,EAAE,GAAG,EAAU;QACnC,oBAAoB,EAAE,GAAG,EAAY;KACrC,CAAA;IAID,eAAe,CAAC,KAAc;QAC7B,IAAI,CAAC,YAAY,GAAG,KAAK,CAAA;IAC1B,CAAC;IAID,QAAQ,CAAC,KAA6B;QACrC,IAAI,CAAC,KAAK,GAAG,KAAK,CAAA;IACnB,CAAC"}
@@ -0,0 +1,13 @@
1
+ import { ProgressItem } from "../parts/types.js";
2
+ import { SpeechRecognizerHostEvents } from "./schematic.js";
3
+ export declare const setupWhisperHost: (events: SpeechRecognizerHostEvents) => import("@e280/comrade").SetupHost<{
4
+ work: {
5
+ transcribe(input: import("../parts/types.js").TranscriptionMessage): Promise<import("../parts/types.js").TranscriptionResult | null>;
6
+ };
7
+ host: {
8
+ updateModelLoadProgress(item: ProgressItem): Promise<void>;
9
+ deliverTranscriptionChunk(chunk: import("../parts/types.js").TranscriptionChunk): Promise<void>;
10
+ updateTps(value: number): Promise<void>;
11
+ updateTranscribeProgress(value: number): Promise<void>;
12
+ };
13
+ }>;
@@ -0,0 +1,19 @@
1
+ import { Comrade } from "@e280/comrade";
2
+ export const setupWhisperHost = (events) => (Comrade.host(_shell => ({
3
+ async updateModelLoadProgress(item) {
4
+ events.onModelLoadProgress.pub(item);
5
+ },
6
+ async deliverTranscriptionChunk(chunk) {
7
+ events.onTranscriptionChunk.pub({
8
+ text: chunk.text,
9
+ timestamp: chunk.timestamp
10
+ });
11
+ },
12
+ async updateTps(value) {
13
+ events.onTpsUpdate.pub(value);
14
+ },
15
+ async updateTranscribeProgress(value) {
16
+ events.onTranscribeProgress(value);
17
+ }
18
+ })));
19
+ //# sourceMappingURL=host.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"host.js","sourceRoot":"","sources":["../../../../../s/tools/speech-recognition/whisper/fns/host.ts"],"names":[],"mappings":"AACA,OAAO,EAAC,OAAO,EAAC,MAAM,eAAe,CAAA;AAIrC,MAAM,CAAC,MAAM,gBAAgB,GAAG,CAAC,MAAkC,EAAE,EAAE,CAAC,CACvE,OAAO,CAAC,IAAI,CAAmB,MAAM,CAAC,EAAE,CAAC,CAAC;IACzC,KAAK,CAAC,uBAAuB,CAAC,IAAI;QACjC,MAAM,CAAC,mBAAmB,CAAC,GAAG,CAAC,IAAI,CAAC,CAAA;IACrC,CAAC;IACD,KAAK,CAAC,yBAAyB,CAAC,KAAK;QACpC,MAAM,CAAC,oBAAoB,CAAC,GAAG,CAAC;YAC/B,IAAI,EAAE,KAAK,CAAC,IAAI;YAChB,SAAS,EAAE,KAAK,CAAC,SAAS;SAC1B,CAAC,CAAA;IACH,CAAC;IACD,KAAK,CAAC,SAAS,CAAC,KAAK;QACpB,MAAM,CAAC,WAAW,CAAC,GAAG,CAAC,KAAK,CAAC,CAAA;IAC9B,CAAC;IACD,KAAK,CAAC,wBAAwB,CAAC,KAAK;QACnC,MAAM,CAAC,oBAAoB,CAAC,KAAK,CAAC,CAAA;IACnC,CAAC;CACD,CAAC,CAAC,CACH,CAAA"}
@@ -0,0 +1,19 @@
1
+ import { Pub } from "@e280/stz";
2
+ import { AsSchematic } from "@e280/comrade";
3
+ import { LoaderEvents } from "../../../common/loader.js";
4
+ import { ProgressItem, TranscriptionChunk, TranscriptionMessage, TranscriptionResult, Word } from "../parts/types.js";
5
+ export type WhisperSchematic = AsSchematic<{
6
+ work: {
7
+ transcribe(input: TranscriptionMessage): Promise<TranscriptionResult | null>;
8
+ };
9
+ host: {
10
+ updateModelLoadProgress(item: ProgressItem): Promise<void>;
11
+ deliverTranscriptionChunk(chunk: TranscriptionChunk): Promise<void>;
12
+ updateTps(value: number): Promise<void>;
13
+ updateTranscribeProgress(value: number): Promise<void>;
14
+ };
15
+ }>;
16
+ export interface SpeechRecognizerHostEvents extends LoaderEvents {
17
+ onTranscriptionChunk: Pub<Word[]>;
18
+ onTranscribeProgress: Pub<[number]>;
19
+ }
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=schematic.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"schematic.js","sourceRoot":"","sources":["../../../../../s/tools/speech-recognition/whisper/fns/schematic.ts"],"names":[],"mappings":""}
@@ -0,0 +1,12 @@
1
+ import { TranscriptionChunk } from "../parts/types.js";
2
+ export declare const setupWhisperWork: import("@e280/comrade").SetupWork<{
3
+ work: {
4
+ transcribe(input: import("../parts/types.js").TranscriptionMessage): Promise<import("../parts/types.js").TranscriptionResult | null>;
5
+ };
6
+ host: {
7
+ updateModelLoadProgress(item: import("../parts/types.js").ProgressItem): Promise<void>;
8
+ deliverTranscriptionChunk(chunk: TranscriptionChunk): Promise<void>;
9
+ updateTps(value: number): Promise<void>;
10
+ updateTranscribeProgress(value: number): Promise<void>;
11
+ };
12
+ }>;
@@ -0,0 +1,74 @@
1
+ import { Comrade } from "@e280/comrade";
2
+ //@ts-ignore
3
+ import { WhisperTextStreamer } from "https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.7.0/dist/transformers.min.js";
4
+ import { PipelineFactory } from "../../../common/transformer-pipeline.js";
5
+ // TODO suspicious globals, probably bad
6
+ const pipeline = new PipelineFactory("automatic-speech-recognition");
7
+ let transcriber;
8
+ export const setupWhisperWork = Comrade.work(shell => ({
9
+ async transcribe({ audio, model, language, duration }) {
10
+ const isDistil = model.startsWith("distil-whisper/");
11
+ if (!pipeline.model || pipeline.model !== model) {
12
+ pipeline.instance?.dispose()?.();
13
+ pipeline.instance = null;
14
+ transcriber = await pipeline.createInstance(model, (data) => {
15
+ if (data.progress)
16
+ shell.host.updateModelLoadProgress({
17
+ id: data.file,
18
+ progress: data.progress
19
+ });
20
+ });
21
+ }
22
+ const timePrecision = transcriber.processor.feature_extractor.config.chunk_length /
23
+ transcriber.model.config.max_source_positions;
24
+ const chunkLength = isDistil ? 20 : 30;
25
+ const strideLength = isDistil ? 3 : 5;
26
+ let chunkCount = 0;
27
+ let startTime = null;
28
+ let tokenCount = 0;
29
+ let tps = 0;
30
+ const chunkDuration = chunkLength - strideLength;
31
+ const estimateProgress = () => {
32
+ const audioProgressSeconds = chunkCount * chunkDuration;
33
+ return Math.min(audioProgressSeconds / duration, 1);
34
+ };
35
+ const streamer = new WhisperTextStreamer(transcriber.tokenizer, {
36
+ time_precision: timePrecision,
37
+ token_callback_function: () => {
38
+ startTime ??= performance.now();
39
+ if (++tokenCount > 1) {
40
+ tps = (tokenCount / (performance.now() - startTime)) * 1000;
41
+ shell.host.updateTps(tps);
42
+ }
43
+ },
44
+ callback_function: (textChunk) => {
45
+ shell.host.deliverTranscriptionChunk(textChunk);
46
+ },
47
+ on_finalize: () => {
48
+ startTime = null;
49
+ tokenCount = 0;
50
+ chunkCount++;
51
+ const progress = estimateProgress();
52
+ shell.host.updateTranscribeProgress(progress);
53
+ },
54
+ });
55
+ const output = await transcriber(audio, {
56
+ top_k: 0,
57
+ do_sample: false,
58
+ chunk_length_s: chunkLength,
59
+ stride_length_s: strideLength,
60
+ language,
61
+ task: "transcribe",
62
+ return_timestamps: "word", // if using "word" the on_chunk_start & end is not called thus we cant retrieve timestamps, only after whole thing finishes
63
+ force_full_sequences: false,
64
+ streamer,
65
+ });
66
+ if (!output)
67
+ return null;
68
+ return {
69
+ tps,
70
+ ...output,
71
+ };
72
+ }
73
+ }));
74
+ //# sourceMappingURL=work.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"work.js","sourceRoot":"","sources":["../../../../../s/tools/speech-recognition/whisper/fns/work.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,OAAO,EAAC,MAAM,eAAe,CAAA;AACrC,YAAY;AACZ,OAAO,EAAW,mBAAmB,EAAC,MAAM,uFAAuF,CAAA;AAInI,OAAO,EAAC,eAAe,EAAC,MAAM,yCAAyC,CAAA;AAEvE,wCAAwC;AACxC,MAAM,QAAQ,GAAG,IAAI,eAAe,CAAC,8BAA8B,CAAC,CAAA;AACpE,IAAI,WAAgB,CAAA;AAEpB,MAAM,CAAC,MAAM,gBAAgB,GAAG,OAAO,CAAC,IAAI,CAAmB,KAAK,CAAC,EAAE,CAAC,CAAC;IACxE,KAAK,CAAC,UAAU,CAAC,EAAC,KAAK,EAAE,KAAK,EAAE,QAAQ,EAAE,QAAQ,EAAC;QAClD,MAAM,QAAQ,GAAG,KAAK,CAAC,UAAU,CAAC,iBAAiB,CAAC,CAAA;QAEpD,IAAG,CAAC,QAAQ,CAAC,KAAK,IAAI,QAAQ,CAAC,KAAK,KAAK,KAAK,EAAE,CAAC;YAChD,QAAQ,CAAC,QAAQ,EAAE,OAAO,EAAE,EAAE,EAAE,CAAA;YAChC,QAAQ,CAAC,QAAQ,GAAG,IAAI,CAAA;YACxB,WAAW,GAAG,MAAM,QAAQ,CAAC,cAAc,CAC1C,KAAK,EACL,CAAC,IAAI,EAAE,EAAE;gBACR,IAAG,IAAI,CAAC,QAAQ;oBACf,KAAK,CAAC,IAAI,CAAC,uBAAuB,CAAC;wBAClC,EAAE,EAAE,IAAI,CAAC,IAAI;wBACb,QAAQ,EAAE,IAAI,CAAC,QAAQ;qBACvB,CAAC,CAAA;YACJ,CAAC,CACD,CAAA;QACF,CAAC;QAED,MAAM,aAAa,GAClB,WAAW,CAAC,SAAS,CAAC,iBAAiB,CAAC,MAAM,CAAC,YAAY;YAC3D,WAAW,CAAC,KAAK,CAAC,MAAM,CAAC,oBAAoB,CAAA;QAE9C,MAAM,WAAW,GAAG,QAAQ,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,EAAE,CAAA;QACtC,MAAM,YAAY,GAAG,QAAQ,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAA;QAErC,IAAI,UAAU,GAAG,CAAC,CAAA;QAClB,IAAI,SAAS,GAAkB,IAAI,CAAA;QACnC,IAAI,UAAU,GAAG,CAAC,CAAA;QAClB,IAAI,GAAG,GAAG,CAAC,CAAA;QAEX,MAAM,aAAa,GAAG,WAAW,GAAG,YAAY,CAAA;QAEhD,MAAM,gBAAgB,GAAG,GAAG,EAAE;YAC7B,MAAM,oBAAoB,GAAG,UAAU,GAAG,aAAa,CAAA;YACvD,OAAO,IAAI,CAAC,GAAG,CAAC,oBAAoB,GAAG,QAAQ,EAAE,CAAC,CAAC,CAAA;QACpD,CAAC,CAAA;QAED,MAAM,QAAQ,GAAG,IAAI,mBAAmB,CAAC,WAAW,CAAC,SAAS,EAAE;YAC/D,cAAc,EAAE,aAAa;YAC7B,uBAAuB,EAAE,GAAG,EAAE;gBAC7B,SAAS,KAAK,WAAW,CAAC,GAAG,EAAE,CAAA;gBAC/B,IAAI,EAAE,UAAU,GAAG,CAAC,EAAE,CAAC;oBACtB,GAAG,GAAG,CAAC,UAAU,GAAG,CAAC,WAAW,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC,CAAC,GAAG,IAAI,CAAA;oBAC3D,KAAK,CAAC,IAAI,CAAC,SAAS,CAAC,GAAG,CAAC,CAAA;gBAC1B,CAAC;YACF,CAAC;YACD,iBAAiB,EAAE,CAAC,SAAc,EAAE,EAAE;gBACrC,KAAK,CAAC,IAAI,CAAC,yBAAyB,CAAC,SAAS,CAAC,CAAA;YAChD,CAAC;YACD,WAAW,EAAE,GAAG,EAAE;gBACjB,SAAS,GAAG,IAAI,CAAA;gBAChB,UAAU,GAAG,CAAC,CAAA;gBACd,UAAU,EAAE,CAAA;gBACZ,MAAM,QAAQ,GAAG,gBAAgB,EAAE,CAAA;gBACnC,KAAK,CAAC,IAAI,CAAC,wBAAwB,CAAC,QAAQ,CAAC,CAAA;YAC9C,CAAC;SACD,CAAC,CAAA;QAEF,MAAM,MAAM,GAAG,MAAM,WAAW,CAAC,KAAK,EAAE;YACvC,KAAK,EAAE,CAAC;YACR,SAAS,EAAE,KAAK;YAChB,cAAc,EAAE,WAAW;YAC3B,eAAe,EAAE,YAAY;YAC7B,QAAQ;YACR,IAAI,EAAE,YAAY;YAClB,iBAAiB,EAAE,MAAM,EAAE,2HAA2H;YACtJ,oBAAoB,EAAE,KAAK;YAC3B,QAAQ;SACR,CAAC,CAAA;QAEF,IAAI,CAAC,MAAM;YAAE,OAAO,IAAI,CAAA;QAExB,OAAO;YACN,GAAG;YACH,GAAG,MAAM;SACT,CAAA;IACF,CAAC;CACD,CAAC,CAAC,CAAA"}
@@ -0,0 +1,31 @@
1
+ export interface ProgressItem {
2
+ id: string;
3
+ progress: number;
4
+ }
5
+ export type Word = {
6
+ text: string;
7
+ timestamp: [start: number, end: number];
8
+ };
9
+ export type WordGroup = Word[];
10
+ export type Transcript = WordGroup[];
11
+ export interface TranscriptionChunk {
12
+ text: string;
13
+ offset: number;
14
+ timestamp: [number, number];
15
+ finalised: boolean;
16
+ }
17
+ export interface TranscriptionMessage {
18
+ audio: Float32Array;
19
+ model: string;
20
+ subtask: string | null;
21
+ language: string | null;
22
+ duration: number;
23
+ }
24
+ export interface TranscriptionResult {
25
+ text: string;
26
+ chunks: TranscriptionChunk[];
27
+ tps: number;
28
+ }
29
+ export type ProgressCallback = (data: any) => void;
30
+ export type SpeechRecognizerModels = "onnx-community/whisper-tiny_timestamped";
31
+ export type SpeechRecognizerSubtasks = "transcribe";
@@ -0,0 +1,2 @@
1
+ export {};
2
+ //# sourceMappingURL=types.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"types.js","sourceRoot":"","sources":["../../../../../s/tools/speech-recognition/whisper/parts/types.ts"],"names":[],"mappings":""}
@@ -0,0 +1,4 @@
1
+ import { Comrade } from "@e280/comrade";
2
+ import { setupWhisperWork } from "../fns/work.js";
3
+ await Comrade.worker(setupWhisperWork);
4
+ //# sourceMappingURL=worker.bundle.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"worker.bundle.js","sourceRoot":"","sources":["../../../../../s/tools/speech-recognition/whisper/parts/worker.bundle.ts"],"names":[],"mappings":"AAAA,OAAO,EAAC,OAAO,EAAC,MAAM,eAAe,CAAA;AAErC,OAAO,EAAC,gBAAgB,EAAC,MAAM,gBAAgB,CAAA;AAG/C,MAAM,OAAO,CAAC,MAAM,CAAmB,gBAAgB,CAAC,CAAA"}
@@ -0,0 +1,8 @@
1
+ function pe(e,t){return{error:r=>e.error({...t,...r}),rpcRequest:r=>e.rpcRequest({...t,...r}),rpcError:r=>e.rpcError({...t,...r})}}var N=()=>e=>({plain:e.none,errMessage:e.mix(e.brightRed,e.bold),errName:e.red,errStack:e.mix(e.red,e.dim),timestamp:e.blue,timestampErr:e.red});function ke(){return N()}var b=Object.freeze({black:"\x1B[30m",red:"\x1B[31m",green:"\x1B[32m",yellow:"\x1B[33m",blue:"\x1B[34m",magenta:"\x1B[35m",cyan:"\x1B[36m",white:"\x1B[37m",brightBlack:"\x1B[90m",brightRed:"\x1B[91m",brightGreen:"\x1B[92m",brightYellow:"\x1B[93m",brightBlue:"\x1B[94m",brightMagenta:"\x1B[95m",brightCyan:"\x1B[96m",brightWhite:"\x1B[97m",bgBlack:"\x1B[40m",bgRed:"\x1B[41m",bgGreen:"\x1B[42m",bgYellow:"\x1B[43m",bgBlue:"\x1B[44m",bgMagenta:"\x1B[45m",bgCyan:"\x1B[46m",bgWhite:"\x1B[47m",bgBrightBlack:"\x1B[100m",bgBrightRed:"\x1B[101m",bgBrightGreen:"\x1B[102m",bgBrightYellow:"\x1B[103m",bgBrightBlue:"\x1B[104m",bgBrightMagenta:"\x1B[105m",bgBrightCyan:"\x1B[106m",bgBrightWhite:"\x1B[107m",bold:"\x1B[1m",dim:"\x1B[2m",italic:"\x1B[3m",underline:"\x1B[4m",inverse:"\x1B[7m",hidden:"\x1B[8m",strikethrough:"\x1B[9m",reset:"\x1B[0m"});var _=()=>({none:e=>e,uncolor:Qe,mix:Ke,hex:Ge,rgb:Se,bgRgb:Xe});function Qe(e){return e.replace(/[\u001b\u009b][[()#;?]*(?:[0-9]{1,4}(?:;[0-9]{0,4})*)?[0-9A-ORZcf-nqry=><]/g,"")}function Ke(...e){return t=>{for(let r of e)t=r(t);return t}}function Ge(e){e=e.replace(/^#/,"");let t,r,o,n;if(e.length===3)t=parseInt(e.split("").map(s=>s+s).join(""),16);else if(e.length===6)t=parseInt(e,16);else throw new Error("Invalid hex color");return r=t>>16&255,o=t>>8&255,n=t&255,Se(r,o,n)}function Se(e,t,r){let o=`\x1B[38;2;${e};${t};${r}m`;return n=>`${o}${n}${b.reset}`}function Xe(e,t,r){let o=`\x1B[48;2;${e};${t};${r}m`;return n=>`${o}${n}${b.reset}`}var A={...Object.fromEntries(Object.entries(b).map(([e])=>[e,t=>t])),..._()};var P={...Object.fromEntries(Object.entries(b).map(([e,t])=>[e,r=>`${t}${r}${b.reset}`])),..._()};function me(){return typeof Deno<"u"&&typeof Deno.version<"u"}function le(){return typeof process<"u"&&process.versions&&process.versions.node}function Ee(){return le()?process.env.FORCE_COLOR||process.stdout.isTTY&&process.env.TERM!=="dumb":me()?Deno.env.get("FORCE_COLOR")||Deno.isatty(Deno.stdout.rid)&&Deno.env.get("TERM")!=="dumb":!1}var de=()=>Ee()?P:A;var L=()=>({colors:e,theme:t})=>{let r=t(e);function o(i){let c=i.stack?`
2
+ `+i.stack+`
3
+ `:"";return[r.errName(i.name+":"),r.errMessage(i.message)].join(" ")+r.errStack(c)}function n(i){return i&&i instanceof Error?o(i):i}function s(i){return i&&i instanceof Error?o(i):r.errMessage(i)}return{stdout:i=>i.map(n),stderr:i=>i.map(s)}};function M(...e){return t=>({stdout:r=>{for(let o of e)r=o(t).stdout(r);return r},stderr:r=>{for(let o of e)r=o(t).stderr(r);return r}})}function et(){return{icon:"\u{1F6A8}",now:()=>Date.now()}}var V=e=>({colors:t,theme:r})=>{let o={...et(),...e},n=r(t),s=new Date(o.now()),i=s.getUTCFullYear().toString().padStart(4,"0"),c=(s.getUTCMonth()+1).toString().padStart(2,"0"),a=s.getUTCDate().toString().padStart(2,"0"),u=`${i}-${c}-${a}`,f=s.getUTCHours().toString().padStart(2,"0"),p=s.getUTCMinutes().toString().padStart(2,"0"),z=s.getUTCSeconds().toString().padStart(2,"0"),ue=s.getUTCMilliseconds().toString().padStart(3,"0"),fe=`${f}:${p}:${z}.${ue}`,U=`${u}::${fe}`;return{stdout:O=>[n.timestamp(U),...O],stderr:O=>[n.timestampErr(U),...[o.icon].filter(Boolean),...O]}};function je(){return M(L(),V())}var Y=()=>({stdout:async e=>{await Deno.stdout.write(new TextEncoder().encode(e+`
4
+ `))},stderr:async e=>{await Deno.stderr.write(new TextEncoder().encode(e+`
5
+ `))}});var Z=()=>({stdout:async e=>void process.stdout.write(e+`
6
+ `),stderr:async e=>void process.stderr.write(e+`
7
+ `)});var J=()=>({stdout:async e=>console.log(e),stderr:async e=>console.error(e)});var Te=()=>me()?Y():le()?Z():J();var Oe=()=>({stdout:async()=>{},stderr:async()=>{}});function Re(){return()=>({stdout:e=>e,stderr:e=>e})}var R=class e{static writers={auto:Te,void:Oe,deno:Y,node:Z,console:J};static colors={auto:de,colorful:()=>P,colorless:()=>A};static themes={auto:ke,basic:N};static shapers={auto:je,none:Re,errors:L,timestamp:V};writer=e.writers.auto();colors=e.colors.auto();theme=e.themes.auto();shaper=e.shapers.auto();async log(...t){await this.writer.stdout(this.shaper(this).stdout(t).join(" "))}async error(...t){await this.writer.stderr(this.shaper(this).stderr(t).join(" "))}setWriter(t){return this.writer=t,this}setColors(t){return this.colors=t,this}setTheme(t){return this.theme=t,this}setShaper(...t){return this.shaper=M(...t),this}};var $=class extends R{static dummy(){return new this().setWriter(R.writers.void())}rpcRequest=async({request:t,...r})=>{let o=this.colors.none;this.log(...this.#e(r),o(`${t.method}()`))};rpcError=async({request:t,error:r,...o})=>{this.error(...this.#e(o),`${t.method}()`,r)};#e({meta:t,label:r,remote:o}){let n=this.colors.mix(this.colors.blue,this.colors.dim),s=this.colors.mix(this.colors.cyan,this.colors.dim);return[t?this.#t(t):void 0,r||void 0,o===void 0?void 0:o?n("<-"):s("->")].filter(Boolean)}#t(t){let{headers:r}=t.request;return[this.colors.yellow(`[${t.ip}]`),this.colors.green(r.origin?r.origin:"(no-origin)")].join(" ")}};var m=class extends ${rpcRequest=async()=>{}};var l=Object.freeze({eq(e,t){if(e.length!==t.length)return!1;for(let r=0;r<=e.length;r++)if(e.at(r)!==t.at(r))return!1;return!0},random(e){return crypto.getRandomValues(new Uint8Array(e))}});var B=Object.freeze({fromBytes(e){return[...e].map(t=>t.toString(16).padStart(2,"0")).join("")},toBytes(e){if(e.length%2!==0)throw new Error("must have even number of hex characters");let t=new Uint8Array(e.length/2);for(let r=0;r<e.length;r+=2)t[r/2]=parseInt(e.slice(r,r+2),16);return t},random(e=32){return this.fromBytes(l.random(e))},string(e){return B.fromBytes(e)},bytes(e){return B.toBytes(e)}});var he=58,Q="123456789ABCDEFGHJKLMNPQRSTUVWXYZabcdefghijkmnopqrstuvwxyz",ge=Object.freeze({fromBytes(e){let t=BigInt("0x"+B.fromBytes(e)),r="";for(;t>0;){let o=t%BigInt(he);t=t/BigInt(he),r=Q[Number(o)]+r}for(let o of e)if(o===0)r=Q[0]+r;else break;return r},toBytes(e){let t=BigInt(0);for(let i of e){let c=Q.indexOf(i);if(c===-1)throw new Error(`Invalid character '${i}' in base58 string`);t=t*BigInt(he)+BigInt(c)}let r=t.toString(16);r.length%2!==0&&(r="0"+r);let o=B.toBytes(r),n=0;for(let i of e)if(i===Q[0])n++;else break;let s=new Uint8Array(n+o.length);return s.set(o,n),s},random(e=32){return this.fromBytes(l.random(e))},string(e){return ge.fromBytes(e)},bytes(e){return ge.toBytes(e)}});var Ce=class{lexicon;static lexicons=Object.freeze({base2:{characters:"01"},hex:{characters:"0123456789abcdef"},base36:{characters:"0123456789abcdefghijklmnopqrstuvwxyz"},base58:{characters:"123456789ABCDEFGHJKLMNPQRSTUVWXYZabcdefghijkmnopqrstuvwxyz"},base62:{characters:"0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"},base64url:{negativePrefix:"~",characters:"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-_"},base64:{characters:"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/",padding:{character:"=",size:4}}});lookup;negativePrefix;constructor(t){this.lexicon=t,this.lookup=Object.fromEntries([...t.characters].map((r,o)=>[r,o])),this.negativePrefix=t.negativePrefix??"-"}toBytes(t){let r=Math.log2(this.lexicon.characters.length);if(Number.isInteger(r)){let c=0,a=0,u=[];for(let f of t){if(f===this.lexicon.padding?.character)continue;let p=this.lookup[f];if(p===void 0)throw new Error(`Invalid character: ${f}`);for(c=c<<r|p,a+=r;a>=8;)a-=8,u.push(c>>a&255)}return new Uint8Array(u)}let o=0n,n=BigInt(this.lexicon.characters.length),s=!1;t.startsWith(this.negativePrefix)&&(t=t.slice(this.negativePrefix.length),s=!0);for(let c of t){let a=this.lookup[c];if(a===void 0)throw new Error(`Invalid character: ${c}`);o=o*n+BigInt(a)}let i=[];for(;o>0n;)i.unshift(Number(o%256n)),o=o/256n;return new Uint8Array(i)}fromBytes(t){let r=Math.log2(this.lexicon.characters.length);if(Number.isInteger(r)){let i=0,c=0,a="";for(let u of t)for(i=i<<8|u,c+=8;c>=r;){c-=r;let f=i>>c&(1<<r)-1;a+=this.lexicon.characters[f]}if(c>0){let u=i<<r-c&(1<<r)-1;a+=this.lexicon.characters[u]}if(this.lexicon.padding)for(;a.length%this.lexicon.padding.size!==0;)a+=this.lexicon.padding.character;return a}let o=0n;for(let i of t)o=(o<<8n)+BigInt(i);if(o===0n)return this.lexicon.characters[0];let n=BigInt(this.lexicon.characters.length),s="";for(;o>0n;)s=this.lexicon.characters[Number(o%n)]+s,o=o/n;return s}toInteger(t){if(!t)return 0;let r=0n,o=!1,n=BigInt(this.lexicon.characters.length);t.startsWith(this.negativePrefix)&&(t=t.slice(this.negativePrefix.length),o=!0);for(let s of t){let i=this.lookup[s];if(i===void 0)throw new Error(`Invalid character: ${s}`);r=r*n+BigInt(i)}return Number(o?-r:r)}fromInteger(t){t=Math.floor(t);let r=t<0,o=BigInt(r?-t:t);if(o===0n)return this.lexicon.characters[0];let n=BigInt(this.lexicon.characters.length),s="";for(;o>0n;)s=this.lexicon.characters[Number(o%n)]+s,o=o/n;return r?`${this.negativePrefix}${s}`:s}random(t=32){return this.fromBytes(l.random(t))}};var xe=Object.freeze({fromBytes(e){return typeof btoa=="function"?btoa(String.fromCharCode(...e)):Buffer.from(e).toString("base64")},toBytes(e){return typeof atob=="function"?Uint8Array.from(atob(e),t=>t.charCodeAt(0)):Uint8Array.from(Buffer.from(e,"base64"))},random(e=32){return this.fromBytes(l.random(e))},string(e){return xe.fromBytes(e)},bytes(e){return xe.toBytes(e)}});var Ie=Object.freeze({fromBytes(e){return new TextDecoder().decode(e)},toBytes(e){return new TextEncoder().encode(e)},string(e){return Ie.fromBytes(e)},bytes(e){return Ie.toBytes(e)}});var K=Object.freeze({set:e=>e!=null,unset:e=>e==null,boolean:e=>typeof e=="boolean",number:e=>typeof e=="number",string:e=>typeof e=="string",bigint:e=>typeof e=="bigint",object:e=>typeof e=="object"&&e!==null,array:e=>Array.isArray(e),fn:e=>typeof e=="function",symbol:e=>typeof e=="symbol"});var D=class extends Error{milliseconds;name=this.constructor.name;constructor(t){super(`deadline exceeded (${(t/1e3).toFixed(1)} seconds)`),this.milliseconds=t}};function G(e,t){return e<=0||e===1/0?t():new Promise((r,o)=>{let n=setTimeout(()=>o(new D(e)),e);t().then(r).catch(o).finally(()=>clearTimeout(n))})}function v(){let e,t,r=new Promise((n,s)=>{e=n,t=s});function o(n){return n.then(e).catch(t),r}return{promise:r,resolve:e,reject:t,entangle:o}}function ze(e,t){let r=e;for(let o of t)if(r=r[o],K.unset(r))break;return r}function tt(e){return{map:t=>Ae(e,t),filter:t=>Pe(e,t)}}tt.pipe=Object.freeze({map:e=>t=>Ae(t,e),filter:e=>t=>Pe(t,e)});var Ae=(e,t)=>Object.fromEntries(Object.entries(e).map(([r,o])=>[r,t(o,r)])),Pe=(e,t)=>Object.fromEntries(Object.entries(e).filter(([r,o])=>t(o,r)));function rt(){let e=new Set;function t(s){return e.add(s),()=>{e.delete(s)}}async function r(...s){await Promise.all([...e].map(i=>i(...s)))}async function o(){let{promise:s,resolve:i}=v(),c=t((...a)=>{i(a),c()});return s}function n(){e.clear()}return t.pub=r,t.sub=t,t.on=t,t.next=o,t.clear=n,r.pub=r,r.sub=t,r.on=t,r.next=o,r.clear=n,[r,t]}function X(e){let t=rt()[0];return e&&t.sub(e),t}var g=class{#e=[];add(...t){return this.#e.push(...t),this}disposable(t){return this.bag(t,()=>t.dispose())}bag(t,r){return this.add(()=>r(t)),t}dispose(){for(let t of this.#e.reverse())t();this.#e=[]}};var w;(function(e){e.version="2.0";function t(r){return"id"in r?r.id:null}e.getId=t,e.errorCodes={serverError:-32e3,unexposedError:-32001}})(w||(w={}));var ee=class extends Error{name=this.constructor.name},k=class extends Error{name=this.constructor.name};async function Me({tap:e,request:t,action:r}){let o=w.getId(t);try{let n=await r();return o===null?null:{id:o,result:n,jsonrpc:w.version}}catch(n){return e.rpcError({request:t,error:n}),o===null?null:{id:o,jsonrpc:w.version,error:n instanceof ee?{code:w.errorCodes.serverError,message:n.message}:{code:w.errorCodes.unexposedError,message:"unexposed error"}}}}function te(e){let t=e.tap??new m;return async r=>{let o=r.method.split("."),n=ze(e.fns,o),s=async()=>await n(...r.params);return t.rpcRequest({request:r}),await Me({tap:t,request:r,action:s})}}var $e=Symbol("tune"),ot=Symbol("query"),nt=Symbol("notify"),st=Symbol("settings");function De(e){function t(r){let o={notify:void 0};return new Proxy(()=>{},{apply:(n,s,i)=>e(r,i,o),get:(n,s)=>{if(s!=="then")return s===$e?i=>(...c)=>e(r,c,{...o,...i}):s===nt?(...i)=>e(r,i,{...o,notify:!0}):s===ot?(...i)=>e(r,i,{...o,notify:!1}):s===st?o:(n[s]||(n[s]=t([...r,s])),n[s])},set:(n,s,i)=>(n[s]=i,!0)})}return t([])}function S(e){let{endpoint:t,tap:r=new m}=e,o=1;return De(async(n,s,i)=>{let c=i.notify??e.notify??!1,a=i.transfer,u={jsonrpc:"2.0",method:n.join("."),params:s},f=c?u:{...u,id:o++};r.rpcRequest({request:f});let p=await t(f,{transfer:a});if(c&&!p)return null;if(!p)throw new k("response was null, but shouldn't be, because the request was not a notification");if("error"in p)throw new k(e.label?`${e.label}: ${p.error.message}`:p.error.message);return p.result})}function q(e){return S({endpoint:te(e),tap:e.tap})}var E=class{recv=X();sendRequest=X();sendResponse=X();static makeEntangledPair({origin:t="example.e280.org"}={}){let r=new this,o=new this,n=[r.sendRequest.sub(i=>o.recv(i,{origin:t})),r.sendResponse.sub(i=>o.recv(i,{origin:t})),o.sendRequest.sub(i=>r.recv(i,{origin:t})),o.sendResponse.sub(i=>r.recv(i,{origin:t}))];return[r,o,()=>n.forEach(i=>i())]}};function re(e,t){return e.addEventListener("message",t),()=>e.removeEventListener("message",t)}function qe(e,t){return async(r,{transfer:o}={})=>{if("id"in r){let n=v();return t(r,o,n.promise),e.wait(r.id,r.method).then(s=>(n.resolve(s),s))}else{let n=Promise.resolve(null);return t(r,o,n),n}}}function We(e){let t=[],r=[];for(let o of Array.isArray(e)?e:[e])"method"in o?t.push(o):r.push(o);return{requests:t,responses:r}}async function Fe(e,t){let r=(await Promise.all(t.map(async o=>e(o)))).filter(o=>o!==null);return r.length===0?null:r.length===1?r[0]:r}var C=class extends E{#e=new g;constructor(t){super(),this.#e.add(this.sendRequest.sub((r,o)=>t.postMessage(r,o)),this.sendResponse.sub((r,o)=>t.postMessage(r,o)),re(t,r=>this.recv(r.data,r)))}dispose(){this.#e.dispose()}};var oe=class{remote;transfer;constructor(t){this.remote=t}};var ye=Object.freeze({timeout:6e4,maxRequestBytes:1e7});var ne=class{timeout;pending=new Map;constructor(t){this.timeout=t}async wait(t,r){let o=v();return this.pending.set(t,{method:r,deferred:o}),await G(this.timeout,()=>o.promise).catch(n=>{throw n instanceof D&&(n.message=`request #${t} ${r}(), ${n.message}`),n})}deliverResponse(t){let r=this.pending.get(t.id);r&&("error"in t?r.deferred.reject(new k(t.error.message)):r.deferred.resolve(t))}};var j=class{options;remote;remoteEndpoint;#e;#t=new g;constructor(t){this.options=t;let{conduit:r,tap:o}=t;this.#e=new ne(t.timeout??ye.timeout),this.remoteEndpoint=qe(this.#e,r.sendRequest.pub.bind(r.sendRequest)),this.remote=S({endpoint:this.remoteEndpoint,tap:o&&pe(o,{remote:!0})}),this.#t.add(r.recv.sub(n=>this.recv(n)))}async recv(t){let r=new oe(this.remote),{conduit:o,rpc:n,tap:s}=this.options,{requests:i,responses:c}=We(t);for(let p of c)this.#e.deliverResponse(p);if(!n)return;let a=await n(r),u=te({fns:a,tap:s&&pe(s,{remote:!1})}),f=await Fe(u,i);f&&await o.sendResponse(f,r.transfer)}dispose(){this.#t.dispose()}};var x={derive:{host:e=>({host:e.remote.host,get transfer(){return e.transfer},set transfer(t){e.transfer=t}}),work:e=>({work:e.remote,get transfer(){return e.transfer},set transfer(t){e.transfer=t}})},mock:{host:()=>({host:void 0,transfer:void 0}),work:()=>({work:void 0,transfer:void 0})}};var y=new m;async function He(e,t,r={}){let o=r.tap??y,n=new j({tap:o,timeout:r.timeout??1/0,conduit:new C(e.getSelf()),rpc:async s=>t(x.derive.host(s))});return await n.remote.infra.ready(),n.remote.host}var d=Object.freeze({eq(e,t){if(e.length!==t.length)return!1;for(let r=0;r<=e.length;r++)if(e.at(r)!==t.at(r))return!1;return!0},random(e){return crypto.getRandomValues(new Uint8Array(e))}});var T=Object.freeze({fromBytes(e){return[...e].map(t=>t.toString(16).padStart(2,"0")).join("")},toBytes(e){if(e.length%2!==0)throw new Error("must have even number of hex characters");let t=new Uint8Array(e.length/2);for(let r=0;r<e.length;r+=2)t[r/2]=parseInt(e.slice(r,r+2),16);return t},random(e=32){return this.fromBytes(d.random(e))},string(e){return T.fromBytes(e)},bytes(e){return T.toBytes(e)}});var be=58,se="123456789ABCDEFGHJKLMNPQRSTUVWXYZabcdefghijkmnopqrstuvwxyz",we=Object.freeze({fromBytes(e){let t=BigInt("0x"+T.fromBytes(e)),r="";for(;t>0;){let o=t%BigInt(be);t=t/BigInt(be),r=se[Number(o)]+r}for(let o of e)if(o===0)r=se[0]+r;else break;return r},toBytes(e){let t=BigInt(0);for(let i of e){let c=se.indexOf(i);if(c===-1)throw new Error(`Invalid character '${i}' in base58 string`);t=t*BigInt(be)+BigInt(c)}let r=t.toString(16);r.length%2!==0&&(r="0"+r);let o=T.toBytes(r),n=0;for(let i of e)if(i===se[0])n++;else break;let s=new Uint8Array(n+o.length);return s.set(o,n),s},random(e=32){return this.fromBytes(d.random(e))},string(e){return we.fromBytes(e)},bytes(e){return we.toBytes(e)}});var Ue=class{lexicon;static lexicons=Object.freeze({base2:{characters:"01"},hex:{characters:"0123456789abcdef"},base36:{characters:"0123456789abcdefghijklmnopqrstuvwxyz"},base58:{characters:"123456789ABCDEFGHJKLMNPQRSTUVWXYZabcdefghijkmnopqrstuvwxyz"},base62:{characters:"0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"},base64url:{negativePrefix:"~",characters:"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-_"},base64:{characters:"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/",padding:{character:"=",size:4}}});lookup;negativePrefix;constructor(t){this.lexicon=t,this.lookup=Object.fromEntries([...t.characters].map((r,o)=>[r,o])),this.negativePrefix=t.negativePrefix??"-"}toBytes(t){let r=Math.log2(this.lexicon.characters.length);if(Number.isInteger(r)){let c=0,a=0,u=[];for(let f of t){if(f===this.lexicon.padding?.character)continue;let p=this.lookup[f];if(p===void 0)throw new Error(`Invalid character: ${f}`);for(c=c<<r|p,a+=r;a>=8;)a-=8,u.push(c>>a&255)}return new Uint8Array(u)}let o=0n,n=BigInt(this.lexicon.characters.length),s=!1;t.startsWith(this.negativePrefix)&&(t=t.slice(this.negativePrefix.length),s=!0);for(let c of t){let a=this.lookup[c];if(a===void 0)throw new Error(`Invalid character: ${c}`);o=o*n+BigInt(a)}let i=[];for(;o>0n;)i.unshift(Number(o%256n)),o=o/256n;return new Uint8Array(i)}fromBytes(t){let r=Math.log2(this.lexicon.characters.length);if(Number.isInteger(r)){let i=0,c=0,a="";for(let u of t)for(i=i<<8|u,c+=8;c>=r;){c-=r;let f=i>>c&(1<<r)-1;a+=this.lexicon.characters[f]}if(c>0){let u=i<<r-c&(1<<r)-1;a+=this.lexicon.characters[u]}if(this.lexicon.padding)for(;a.length%this.lexicon.padding.size!==0;)a+=this.lexicon.padding.character;return a}let o=0n;for(let i of t)o=(o<<8n)+BigInt(i);if(o===0n)return this.lexicon.characters[0];let n=BigInt(this.lexicon.characters.length),s="";for(;o>0n;)s=this.lexicon.characters[Number(o%n)]+s,o=o/n;return s}toInteger(t){if(!t)return 0;let r=0n,o=!1,n=BigInt(this.lexicon.characters.length);t.startsWith(this.negativePrefix)&&(t=t.slice(this.negativePrefix.length),o=!0);for(let s of t){let i=this.lookup[s];if(i===void 0)throw new Error(`Invalid character: ${s}`);r=r*n+BigInt(i)}return Number(o?-r:r)}fromInteger(t){t=Math.floor(t);let r=t<0,o=BigInt(r?-t:t);if(o===0n)return this.lexicon.characters[0];let n=BigInt(this.lexicon.characters.length),s="";for(;o>0n;)s=this.lexicon.characters[Number(o%n)]+s,o=o/n;return r?`${this.negativePrefix}${s}`:s}random(t=32){return this.fromBytes(d.random(t))}};var Be=Object.freeze({fromBytes(e){return typeof btoa=="function"?btoa(String.fromCharCode(...e)):Buffer.from(e).toString("base64")},toBytes(e){return typeof atob=="function"?Uint8Array.from(atob(e),t=>t.charCodeAt(0)):Uint8Array.from(Buffer.from(e,"base64"))},random(e=32){return this.fromBytes(d.random(e))},string(e){return Be.fromBytes(e)},bytes(e){return Be.toBytes(e)}});var Ne=Object.freeze({fromBytes(e){return new TextDecoder().decode(e)},toBytes(e){return new TextEncoder().encode(e)},string(e){return Ne.fromBytes(e)},bytes(e){return Ne.toBytes(e)}});var ve=Object.freeze({set:e=>e!=null,unset:e=>e==null,boolean:e=>typeof e=="boolean",number:e=>typeof e=="number",string:e=>typeof e=="string",bigint:e=>typeof e=="bigint",object:e=>typeof e=="object"&&e!==null,array:e=>Array.isArray(e),fn:e=>typeof e=="function",symbol:e=>typeof e=="symbol"});function W(){let e,t,r=new Promise((n,s)=>{e=n,t=s});function o(n){return n.then(e).catch(t),r}return{promise:r,resolve:e,reject:t,entangle:o}}function ut(e){return{map:t=>_e(e,t),filter:t=>Le(e,t)}}ut.pipe=Object.freeze({map:e=>t=>_e(t,e),filter:e=>t=>Le(t,e)});var _e=(e,t)=>Object.fromEntries(Object.entries(e).map(([r,o])=>[r,t(o,r)])),Le=(e,t)=>Object.fromEntries(Object.entries(e).filter(([r,o])=>t(o,r)));var I=class{worker;messenger;constructor(t,r){this.worker=t,this.messenger=r}static async make(t,r){let o=r.tap??y,n=r.label??"comrade",s=t.loadWorker(r.workerUrl,n),i=W(),c={async ready(){i.resolve()}},a=new j({tap:o,timeout:r.timeout??1/0,conduit:new C(s),rpc:async u=>({infra:c,host:r.setupHost(x.derive.work(u))})});return await i.promise,new this(s,a)}get work(){return this.messenger.remote}terminate(){this.worker.terminate()}};var ie=class{threads;static async make(t,r){let o=r.workerCount??t.guessOptimalThreadCount(),n=await Promise.all([...Array(o)].map(async(s,i)=>I.make(t,{...r,label:r.label??`${r.label??"comrade"}_${i+1}`})));return new this(n,{tap:r.tap})}work;#e=new Set;#t=[];constructor(t,r={}){this.threads=t;let o=r.tap??y,n=async(s,i)=>this.#o({request:s,prom:W(),transfer:i?.transfer});this.work=S({tap:o,endpoint:n}),t.forEach(s=>this.#e.add(s))}get threadCount(){return this.threads.length}terminate(){for(let t of this.threads)t.terminate()}#o(t){return this.#t.push(t),this.#r(),t.prom.promise}#r(){for(;this.#e.size>0&&this.#t.length>0;){let t=[...this.#e].pop();this.#e.delete(t);let r=this.#t.shift();this.#e.delete(t);let o=t.messenger.remoteEndpoint(r.request,{transfer:r.transfer});r.prom.entangle(o).finally(()=>{this.#e.add(t),this.#r()})}}};var Ve=e=>({thread:t=>I.make(e,t),cluster:t=>ie.make(e,t),worker:(t,r={})=>He(e,t,r),work:t=>t,host:t=>t,mocks(t){let{setupWork:r,setupHost:o,tap:n=y}=t,s=x.mock.host(),i=x.mock.work();return i.work=q({tap:n,fns:r(s)}),s.host=q({tap:n,fns:o(i)}),{workShell:i,hostShell:s,work:i.work,host:s.host}},mockWork(t,r=y){let o=x.mock.host(),n=x.mock.work();return n.work=q({tap:r,fns:t(o)}),{workShell:n,hostShell:o,work:n.work,mockHost:s=>(o.host=q({tap:r,fns:s(n)}),{workShell:n,hostShell:o,work:n.work,host:o.host})}}});var Ye=()=>({getSelf(){return self},guessOptimalThreadCount(){let e=navigator.hardwareConcurrency??1;return Math.max(1,e-1)},loadWorker(e,t){return new window.Worker(e,{name:t,type:"module"})},async loadWasm(e){return WebAssembly.instantiateStreaming(fetch(e))}});var ft=Ye(),ce=Ve(ft);import{WhisperTextStreamer as mt}from"https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.7.0/dist/transformers.min.js";import{pipeline as pt}from"https://cdn.jsdelivr.net/npm/@huggingface/transformers@3.7.0/dist/transformers.min.js";var ae=class{task;instance=null;model=null;constructor(t){this.task=t}async createInstance(t,r){return this.model=t,this.instance=await pt(this.task,this.model,{dtype:{encoder_model:this.model==="onnx-community/whisper-large-v3-turbo"?"fp16":"fp32",decoder_model_merged:"q4"},device:"webgpu",progress_callback:r})}};var F=new ae("automatic-speech-recognition"),H,Ze=ce.work(e=>({async transcribe({audio:t,model:r,language:o,duration:n}){let s=r.startsWith("distil-whisper/");(!F.model||F.model!==r)&&(F.instance?.dispose()?.(),F.instance=null,H=await F.createInstance(r,h=>{h.progress&&e.host.updateModelLoadProgress({id:h.file,progress:h.progress})}));let i=H.processor.feature_extractor.config.chunk_length/H.model.config.max_source_positions,c=s?20:30,a=s?3:5,u=0,f=null,p=0,z=0,ue=c-a,fe=()=>{let h=u*ue;return Math.min(h/n,1)},U=new mt(H.tokenizer,{time_precision:i,token_callback_function:()=>{f??=performance.now(),++p>1&&(z=p/(performance.now()-f)*1e3,e.host.updateTps(z))},callback_function:h=>{e.host.deliverTranscriptionChunk(h)},on_finalize:()=>{f=null,p=0,u++;let h=fe();e.host.updateTranscribeProgress(h)}}),O=await H(t,{top_k:0,do_sample:!1,chunk_length_s:c,stride_length_s:a,language:o,task:"transcribe",return_timestamps:"word",force_full_sequences:!1,streamer:U});return O?{tps:z,...O}:null}}));await ce.worker(Ze);
8
+ //# sourceMappingURL=worker.bundle.min.js.map