react-native-executorch 0.5.1-rc.0 → 0.5.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (178) hide show
  1. package/README.md +132 -0
  2. package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +4 -10
  3. package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +1 -1
  4. package/common/rnexecutorch/models/speech_to_text/SpeechToTextStrategy.h +3 -2
  5. package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.cpp +16 -4
  6. package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.h +2 -2
  7. package/lib/Error.d.ts +30 -0
  8. package/lib/Error.js +50 -0
  9. package/lib/constants/directories.d.ts +1 -0
  10. package/lib/constants/directories.js +2 -0
  11. package/lib/constants/llmDefaults.d.ts +6 -0
  12. package/lib/constants/llmDefaults.js +16 -0
  13. package/lib/constants/modelUrls.d.ts +217 -83
  14. package/lib/constants/modelUrls.js +304 -98
  15. package/lib/constants/ocr/models.d.ts +882 -0
  16. package/lib/constants/ocr/models.js +182 -0
  17. package/lib/constants/ocr/symbols.d.ts +75 -0
  18. package/lib/constants/ocr/symbols.js +139 -0
  19. package/lib/{typescript/constants → constants}/sttDefaults.d.ts +0 -1
  20. package/lib/constants/sttDefaults.js +12 -10
  21. package/lib/controllers/LLMController.d.ts +47 -0
  22. package/lib/controllers/LLMController.js +14 -11
  23. package/lib/controllers/OCRController.d.ts +23 -0
  24. package/lib/controllers/OCRController.js +12 -5
  25. package/lib/controllers/SpeechToTextController.d.ts +8 -4
  26. package/lib/controllers/SpeechToTextController.js +15 -9
  27. package/lib/controllers/VerticalOCRController.d.ts +25 -0
  28. package/lib/controllers/VerticalOCRController.js +75 -0
  29. package/lib/hooks/computer_vision/useClassification.d.ts +15 -0
  30. package/lib/hooks/computer_vision/useClassification.js +7 -0
  31. package/lib/hooks/computer_vision/useImageEmbeddings.d.ts +15 -0
  32. package/lib/hooks/computer_vision/useImageEmbeddings.js +7 -0
  33. package/lib/hooks/computer_vision/useImageSegmentation.d.ts +38 -0
  34. package/lib/hooks/computer_vision/useImageSegmentation.js +7 -0
  35. package/lib/hooks/computer_vision/useOCR.d.ts +20 -0
  36. package/lib/hooks/computer_vision/useOCR.js +42 -0
  37. package/lib/hooks/computer_vision/useObjectDetection.d.ts +15 -0
  38. package/lib/hooks/computer_vision/useObjectDetection.js +7 -0
  39. package/lib/hooks/computer_vision/useStyleTransfer.d.ts +15 -0
  40. package/lib/hooks/computer_vision/useStyleTransfer.js +7 -0
  41. package/lib/hooks/computer_vision/useVerticalOCR.d.ts +21 -0
  42. package/lib/hooks/computer_vision/useVerticalOCR.js +45 -0
  43. package/lib/hooks/general/useExecutorchModule.d.ts +13 -0
  44. package/lib/hooks/general/useExecutorchModule.js +7 -0
  45. package/lib/hooks/natural_language_processing/useLLM.d.ts +10 -0
  46. package/lib/hooks/natural_language_processing/useLLM.js +78 -0
  47. package/lib/hooks/natural_language_processing/useSpeechToText.d.ts +27 -0
  48. package/lib/hooks/natural_language_processing/useSpeechToText.js +19 -14
  49. package/lib/hooks/natural_language_processing/useTextEmbeddings.d.ts +16 -0
  50. package/lib/hooks/natural_language_processing/useTextEmbeddings.js +7 -0
  51. package/lib/hooks/natural_language_processing/useTokenizer.d.ts +17 -0
  52. package/lib/hooks/natural_language_processing/useTokenizer.js +52 -0
  53. package/lib/hooks/useModule.d.ts +17 -0
  54. package/lib/hooks/useModule.js +45 -0
  55. package/lib/hooks/useNonStaticModule.d.ts +20 -0
  56. package/lib/hooks/useNonStaticModule.js +49 -0
  57. package/lib/index.d.ts +1 -1
  58. package/lib/index.js +3 -2
  59. package/lib/module/constants/modelUrls.js +61 -36
  60. package/lib/module/constants/modelUrls.js.map +1 -1
  61. package/lib/module/constants/ocr/models.js +1 -1
  62. package/lib/module/hooks/natural_language_processing/useSpeechToText.js +71 -34
  63. package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
  64. package/lib/module/index.js +2 -3
  65. package/lib/module/index.js.map +1 -1
  66. package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +72 -31
  67. package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
  68. package/lib/module/types/stt.js +1 -85
  69. package/lib/module/types/stt.js.map +1 -1
  70. package/lib/module/utils/ResourceFetcher.js +6 -8
  71. package/lib/module/utils/ResourceFetcher.js.map +1 -1
  72. package/lib/module/utils/ResourceFetcherUtils.js +20 -20
  73. package/lib/module/utils/ResourceFetcherUtils.js.map +1 -1
  74. package/lib/module/utils/SpeechToTextModule/ASR.js +191 -0
  75. package/lib/module/utils/SpeechToTextModule/ASR.js.map +1 -0
  76. package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js +73 -0
  77. package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js.map +1 -0
  78. package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js +56 -0
  79. package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js.map +1 -0
  80. package/lib/modules/BaseModule.d.ts +8 -0
  81. package/lib/modules/BaseModule.js +25 -0
  82. package/lib/modules/BaseNonStaticModule.d.ts +9 -0
  83. package/lib/modules/BaseNonStaticModule.js +14 -0
  84. package/lib/modules/computer_vision/ClassificationModule.d.ts +8 -0
  85. package/lib/modules/computer_vision/ClassificationModule.js +17 -0
  86. package/lib/modules/computer_vision/ImageEmbeddingsModule.d.ts +8 -0
  87. package/lib/modules/computer_vision/ImageEmbeddingsModule.js +17 -0
  88. package/lib/modules/computer_vision/ImageSegmentationModule.d.ts +11 -0
  89. package/lib/modules/computer_vision/ImageSegmentationModule.js +27 -0
  90. package/lib/modules/computer_vision/OCRModule.d.ts +15 -0
  91. package/lib/modules/computer_vision/OCRModule.js +20 -0
  92. package/lib/modules/computer_vision/ObjectDetectionModule.d.ts +9 -0
  93. package/lib/modules/computer_vision/ObjectDetectionModule.js +17 -0
  94. package/lib/modules/computer_vision/StyleTransferModule.d.ts +8 -0
  95. package/lib/modules/computer_vision/StyleTransferModule.js +17 -0
  96. package/lib/modules/computer_vision/VerticalOCRModule.d.ts +15 -0
  97. package/lib/modules/computer_vision/VerticalOCRModule.js +22 -0
  98. package/lib/modules/general/ExecutorchModule.d.ts +7 -0
  99. package/lib/modules/general/ExecutorchModule.js +14 -0
  100. package/lib/modules/natural_language_processing/LLMModule.d.ts +28 -0
  101. package/lib/modules/natural_language_processing/LLMModule.js +45 -0
  102. package/lib/modules/natural_language_processing/SpeechToTextModule.d.ts +18 -8
  103. package/lib/modules/natural_language_processing/SpeechToTextModule.js +21 -15
  104. package/lib/modules/natural_language_processing/TextEmbeddingsModule.d.ts +9 -0
  105. package/lib/modules/natural_language_processing/TextEmbeddingsModule.js +21 -0
  106. package/lib/modules/natural_language_processing/TokenizerModule.d.ts +12 -0
  107. package/lib/modules/natural_language_processing/TokenizerModule.js +5 -4
  108. package/lib/native/NativeETInstaller.d.ts +6 -0
  109. package/lib/native/NativeETInstaller.js +2 -0
  110. package/lib/native/NativeOCR.d.ts +8 -0
  111. package/lib/native/NativeOCR.js +2 -0
  112. package/lib/native/NativeVerticalOCR.d.ts +8 -0
  113. package/lib/native/NativeVerticalOCR.js +2 -0
  114. package/lib/types/common.d.ts +31 -0
  115. package/lib/types/common.js +25 -0
  116. package/lib/types/imageSegmentation.d.ts +24 -0
  117. package/lib/types/imageSegmentation.js +26 -0
  118. package/lib/types/llm.d.ts +46 -0
  119. package/lib/types/llm.js +9 -0
  120. package/lib/types/objectDetection.d.ts +104 -0
  121. package/lib/types/objectDetection.js +94 -0
  122. package/lib/types/ocr.d.ts +11 -0
  123. package/lib/types/ocr.js +1 -0
  124. package/lib/types/stt.d.ts +94 -0
  125. package/lib/types/stt.js +85 -0
  126. package/lib/typescript/constants/modelUrls.d.ts +24 -7
  127. package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
  128. package/lib/typescript/constants/ocr/models.d.ts +126 -126
  129. package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -24
  130. package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
  131. package/lib/typescript/index.d.ts +2 -3
  132. package/lib/typescript/index.d.ts.map +1 -1
  133. package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +19 -22
  134. package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
  135. package/lib/typescript/types/stt.d.ts +17 -91
  136. package/lib/typescript/types/stt.d.ts.map +1 -1
  137. package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
  138. package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -1
  139. package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts +27 -0
  140. package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts.map +1 -0
  141. package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts +23 -0
  142. package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts.map +1 -0
  143. package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts +13 -0
  144. package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts.map +1 -0
  145. package/lib/utils/ResourceFetcher.d.ts +24 -0
  146. package/lib/utils/ResourceFetcher.js +305 -0
  147. package/lib/utils/ResourceFetcherUtils.d.ts +54 -0
  148. package/lib/utils/ResourceFetcherUtils.js +9 -0
  149. package/lib/utils/llm.d.ts +6 -0
  150. package/lib/utils/llm.js +1 -0
  151. package/lib/utils/stt.d.ts +1 -0
  152. package/lib/utils/stt.js +21 -0
  153. package/package.json +5 -3
  154. package/src/constants/modelUrls.ts +70 -37
  155. package/src/constants/ocr/models.ts +1 -1
  156. package/src/hooks/natural_language_processing/useSpeechToText.ts +87 -92
  157. package/src/index.ts +6 -8
  158. package/src/modules/natural_language_processing/SpeechToTextModule.ts +81 -69
  159. package/src/types/stt.ts +97 -92
  160. package/src/utils/ResourceFetcher.ts +9 -7
  161. package/src/utils/ResourceFetcherUtils.ts +15 -17
  162. package/src/utils/SpeechToTextModule/ASR.ts +303 -0
  163. package/src/utils/SpeechToTextModule/OnlineProcessor.ts +87 -0
  164. package/src/utils/SpeechToTextModule/hypothesisBuffer.ts +79 -0
  165. package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.cpp +0 -31
  166. package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.h +0 -21
  167. package/lib/module/constants/sttDefaults.js +0 -74
  168. package/lib/module/constants/sttDefaults.js.map +0 -1
  169. package/lib/module/controllers/SpeechToTextController.js +0 -320
  170. package/lib/module/controllers/SpeechToTextController.js.map +0 -1
  171. package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
  172. package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -57
  173. package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
  174. package/src/constants/sttDefaults.ts +0 -82
  175. package/src/controllers/SpeechToTextController.ts +0 -471
  176. package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -7
  177. package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/xcuserdata/norbertklockiewicz.xcuserdatad/UserInterfaceState.xcuserstate +0 -0
  178. package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/xcuserdata/norbertklockiewicz.xcuserdatad/xcschemes/xcschememanagement.plist +0 -14
@@ -0,0 +1,191 @@
1
+ "use strict";
2
+
3
+ // NOTE: This will be implemented in C++
4
+
5
+ import { TokenizerModule } from '../../modules/natural_language_processing/TokenizerModule';
6
+ import { ResourceFetcher } from '../ResourceFetcher';
7
/**
 * Speech-to-text driver around a natively loaded Whisper encoder/decoder.
 *
 * Responsibilities visible in this class: fetching the model files, building
 * the decoder prompt, token-by-token decoding with a temperature fallback, and
 * converting the generated tokens into segments of words whose timestamps are
 * estimated by linear interpolation.
 *
 * NOTE: This will be implemented in C++
 */
export class ASR {
  tokenizerModule = new TokenizerModule();
  // Handle returned by global.loadSpeechToText; assigned in load().
  nativeModule;
  // Ids of the special tokens, resolved through the tokenizer in load().
  startOfTranscriptToken;
  endOfTextToken;
  timestampBeginToken;
  timePrecision = 0.02; // Whisper timestamp precision
  maxDecodeLength = 128;
  chunkSize = 30; // 30 seconds
  minChunkSamples = 1 * 16000; // 1 second
  samplingRate = 16000;

  /**
   * Loads the tokenizer and fetches the encoder/decoder sources in parallel,
   * creates the native module and resolves the special-token ids.
   *
   * @param model Object passed to the tokenizer's load(); its encoderSource
   *   and decoderSource are handed to ResourceFetcher.fetch.
   * @param onDownloadProgressCallback Forwarded to ResourceFetcher.fetch.
   * @throws {Error} 'Download interrupted.' when either fetched source is missing.
   */
  async load(model, onDownloadProgressCallback) {
    const tokenizerLoadPromise = this.tokenizerModule.load(model);
    const encoderDecoderPromise = ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.encoderSource,
      model.decoderSource
    );
    const [, encoderDecoderResults] = await Promise.all([
      tokenizerLoadPromise,
      encoderDecoderPromise,
    ]);
    const encoderSource = encoderDecoderResults?.[0];
    const decoderSource = encoderDecoderResults?.[1];
    if (!encoderSource || !decoderSource) {
      throw new Error('Download interrupted.');
    }
    this.nativeModule = await global.loadSpeechToText(encoderSource, decoderSource, 'whisper');
    this.startOfTranscriptToken = await this.tokenizerModule.tokenToId('<|startoftranscript|>');
    this.endOfTextToken = await this.tokenizerModule.tokenToId('<|endoftext|>');
    this.timestampBeginToken = await this.tokenizerModule.tokenToId('<|0.00|>');
  }

  /**
   * Builds the decoder prompt: start-of-transcript, then (only when
   * options.language is set) the language and '<|transcribe|>' tokens, and
   * finally the '<|0.00|>' timestamp token.
   */
  async getInitialSequence(options) {
    const initialSequence = [this.startOfTranscriptToken];
    if (options.language) {
      const languageToken = await this.tokenizerModule.tokenToId(`<|${options.language}|>`);
      const taskToken = await this.tokenizerModule.tokenToId('<|transcribe|>');
      initialSequence.push(languageToken);
      initialSequence.push(taskToken);
    }
    initialSequence.push(this.timestampBeginToken);
    return initialSequence;
  }

  /**
   * Encodes the audio and decodes tokens one at a time until the
   * end-of-text token is produced or the sequence exceeds maxDecodeLength.
   * A temperature of 0 selects the most probable token; any other value
   * samples from the temperature-scaled distribution.
   *
   * @returns {{sequencesIds: number[], scores: number[]}} The generated
   *   tokens (prompt removed) and, index-aligned with them, the probability
   *   assigned to each chosen token.
   */
  async generate(audio, temperature, options) {
    await this.encode(new Float32Array(audio));
    const initialSequence = await this.getInitialSequence(options);
    const sequencesIds = [...initialSequence];
    const scores = [];
    const greedy = temperature === 0;
    while (sequencesIds.length <= this.maxDecodeLength) {
      // Array.from keeps the softmax arithmetic in double precision.
      const probs = this.softmaxWithTemperature(
        Array.from(await this.decode(sequencesIds)),
        greedy ? 1 : temperature
      );
      const nextTokenId = greedy ? this.argmax(probs) : this.sampleFromDistribution(probs);
      sequencesIds.push(nextTokenId);
      scores.push(probs[nextTokenId]);
      if (nextTokenId === this.endOfTextToken) {
        break;
      }
    }
    return {
      sequencesIds: sequencesIds.slice(initialSequence.length),
      // `scores` never contained entries for the prompt, so it must not be
      // sliced; slicing dropped the first generated scores and skewed the
      // average log-probability used by generateWithFallback.
      scores,
    };
  }

  /**
   * Index of the first largest element (what `indexOf(Math.max(...values))`
   * yields for non-empty input), computed without spreading the whole
   * vocabulary into a call's argument list.
   */
  argmax(values) {
    let best = 0;
    for (let i = 1; i < values.length; i++) {
      if (values[i] > values[best]) {
        best = i;
      }
    }
    return best;
  }

  /**
   * Numerically stable softmax of `logits / temperature` (the maximum logit
   * is subtracted before exponentiation).
   */
  softmaxWithTemperature(logits, temperature = 1.0) {
    let max = -Infinity;
    for (const logit of logits) {
      if (logit > max) {
        max = logit;
      }
    }
    const exps = logits.map(logit => Math.exp((logit - max) / temperature));
    const sum = exps.reduce((a, b) => a + b, 0);
    return exps.map(exp => exp / sum);
  }

  /**
   * Draws an index from a probability distribution by walking its cumulative
   * sum; falls back to the last index if rounding leaves the sum below the
   * drawn number.
   */
  sampleFromDistribution(probs) {
    const r = Math.random();
    let cumulative = 0;
    for (let i = 0; i < probs.length; i++) {
      cumulative += probs[i];
      if (r < cumulative) {
        return i;
      }
    }
    return probs.length - 1;
  }

  /**
   * Decodes with increasing temperatures until the average log-probability
   * of the generated tokens reaches -1.0. When no attempt reaches the
   * threshold the last attempt is used, rather than an empty token list
   * (which produced NaN timestamps and made transcribe() stop early).
   */
  async generateWithFallback(audio, options) {
    const temperatures = [0.0, 0.2, 0.4, 0.6, 0.8, 1.0];
    let generatedTokens = [];
    for (const temperature of temperatures) {
      const { sequencesIds, scores } = await this.generate(audio, temperature, options);
      generatedTokens = sequencesIds;
      const cumLogProb = scores.reduce((acc, score) => acc + Math.log(score), 0);
      const avgLogProb = cumLogProb / sequencesIds.length;
      if (avgLogProb >= -1.0) {
        break;
      }
    }
    return this.calculateWordLevelTimestamps(generatedTokens, audio);
  }

  /**
   * Token that closes the final segment: the last timestamp token in the
   * sequence. When the sequence holds no timestamp token at all, the end of
   * the audio is used, expressed as a timestamp token id.
   */
  findEndTimestampToken(generatedTokens, audio) {
    for (let i = generatedTokens.length - 1; i >= 0; i--) {
      if (generatedTokens[i] >= this.timestampBeginToken) {
        return generatedTokens[i];
      }
    }
    const audioSeconds = audio.length / this.samplingRate;
    return this.timestampBeginToken + Math.round(audioSeconds / this.timePrecision);
  }

  /**
   * Splits the generated tokens into segments at every pair of consecutive
   * timestamp tokens and estimates per-word times inside each segment. When
   * the final timestamp lies beyond the audio duration, all word times are
   * scaled down proportionally.
   */
  async calculateWordLevelTimestamps(generatedTokens, audio) {
    const segments = [];
    let tokens = [];
    let prevTimestamp = this.timestampBeginToken;
    for (let i = 0; i < generatedTokens.length; i++) {
      if (generatedTokens[i] < this.timestampBeginToken) {
        tokens.push(generatedTokens[i]);
      }
      if (
        i > 0 &&
        generatedTokens[i - 1] >= this.timestampBeginToken &&
        generatedTokens[i] >= this.timestampBeginToken
      ) {
        // Two timestamps in a row: the first closes the current segment and
        // the second opens the next one.
        const words = await this.estimateWordTimestampsLinear(
          tokens,
          prevTimestamp,
          generatedTokens[i - 1]
        );
        segments.push({ words });
        tokens = [];
        prevTimestamp = generatedTokens[i];
      }
    }
    // The original read generatedTokens.at(-2), which is undefined or a text
    // token whenever the sequence does not end with "<timestamp><eot>".
    const end = this.findEndTimestampToken(generatedTokens, audio);
    const words = await this.estimateWordTimestampsLinear(tokens, prevTimestamp, end);
    segments.push({ words });
    const scalingFactor =
      audio.length / this.samplingRate / ((end - this.timestampBeginToken) * this.timePrecision);
    if (scalingFactor < 1) {
      for (const segment of segments) {
        for (const word of segment.words) {
          word.start *= scalingFactor;
          word.end *= scalingFactor;
        }
      }
    }
    return segments;
  }

  /**
   * Decodes `tokens` to text and spreads the time between the `start` and
   * `end` timestamp tokens over the words in proportion to their character
   * counts. Every word is returned with a leading space.
   */
  async estimateWordTimestampsLinear(tokens, start, end) {
    const duration = (end - start) * this.timePrecision;
    const segmentText = (await this.tokenizerModule.decode(tokens)).trim();
    const words = segmentText.split(' ').map(w => ` ${w}`);
    const numOfCharacters = words.reduce((acc, word) => acc + word.length, 0);
    const timePerCharacter = duration / numOfCharacters;
    const startTimeOffset = (start - this.timestampBeginToken) * this.timePrecision;
    const wordObjects = [];
    let prevCharNum = 0;
    for (const word of words) {
      const wordStart = startTimeOffset + prevCharNum * timePerCharacter;
      const wordEnd = wordStart + timePerCharacter * word.length;
      wordObjects.push({
        word,
        start: wordStart,
        end: wordEnd,
      });
      prevCharNum += word.length;
    }
    return wordObjects;
  }

  /**
   * Transcribes `audio` in windows of up to chunkSize seconds. `seek` is the
   * window start in seconds; after each window it moves to the end time of
   * the last word produced. Stops when the remaining audio is shorter than
   * minChunkSamples.
   */
  async transcribe(audio, options) {
    let seek = 0;
    const allSegments = [];
    while (seek * this.samplingRate < audio.length) {
      const chunk = audio.slice(
        seek * this.samplingRate,
        (seek + this.chunkSize) * this.samplingRate
      );
      if (chunk.length < this.minChunkSamples) {
        return allSegments;
      }
      const segments = await this.generateWithFallback(chunk, options);
      for (const segment of segments) {
        for (const word of segment.words) {
          word.start += seek;
          word.end += seek;
        }
      }
      allSegments.push(...segments);
      const lastSegment = segments[segments.length - 1];
      const lastTimeStamp = lastSegment.words[lastSegment.words.length - 1].end;
      // Guarantee forward progress: if the model yields no usable end time
      // (NaN, zero-length or backwards), skip past the chunk just processed
      // instead of re-reading the same window forever.
      seek =
        Number.isFinite(lastTimeStamp) && lastTimeStamp > seek
          ? lastTimeStamp
          : seek + chunk.length / this.samplingRate;
    }
    return allSegments;
  }

  /** Flattens segments into [start, end, word] tuples. */
  tsWords(segments) {
    const o = [];
    for (const segment of segments) {
      for (const word of segment.words) {
        o.push([word.start, word.end, word.word]);
      }
    }
    return o;
  }

  /** End time of the last word of every segment. */
  segmentsEndTs(res) {
    return res.map(segment => segment.words[segment.words.length - 1].end);
  }

  /** Runs the native encoder on the waveform. */
  async encode(waveform) {
    await this.nativeModule.encode(waveform);
  }

  /** Runs the native decoder on the token sequence; result is wrapped in a Float32Array. */
  async decode(tokens) {
    return new Float32Array(await this.nativeModule.decode(tokens));
  }
}
191
+ //# sourceMappingURL=ASR.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"names":["TokenizerModule","ResourceFetcher","ASR","tokenizerModule","timePrecision","maxDecodeLength","chunkSize","minChunkSamples","samplingRate","load","model","onDownloadProgressCallback","tokenizerLoadPromise","encoderDecoderPromise","fetch","encoderSource","decoderSource","_","encoderDecoderResults","Promise","all","Error","nativeModule","global","loadSpeechToText","startOfTranscriptToken","tokenToId","endOfTextToken","timestampBeginToken","getInitialSequence","options","initialSequence","language","languageToken","taskToken","push","generate","audio","temperature","encode","Float32Array","sequencesIds","scores","length","logits","softmaxWithTemperature","Array","from","decode","nextTokenId","indexOf","Math","max","sampleFromDistribution","nextTokenProb","slice","exps","map","logit","exp","sum","reduce","a","b","probs","r","random","cumulative","i","generateWithFallback","temperatures","generatedTokens","result","tokens","seqLen","cumLogProb","acc","score","log","avgLogProb","calculateWordLevelTimestamps","segments","prevTimestamp","start","end","wordObjects","estimateWordTimestampsLinear","words","at","scalingFactor","segment","word","duration","segmentText","trim","split","w","numOfCharacters","timePerCharacter","startTimeOffset","prevCharNum","j","transcribe","seek","allSegments","chunk","lastTimeStamp","tsWords","o","segmentsEndTs","res","waveform"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/ASR.ts"],"mappings":";;AAAA;;AAEA,SAASA,eAAe,QAAQ,2DAA2D;AAQ3F,SAASC,eAAe,QAAQ,oBAAoB;AAEpD,OAAO,MAAMC,GAAG,CAAC;EAEPC,eAAe,GAAoB,IAAIH,eAAe,CAAC,CAAC;EAExDI,aAAa,GAAW,IAAI,CAAC,CAAC;EAC9BC,eAAe,GAAW,GAAG;EAC7BC,SAAS,GAAW,EAAE,CAAC,CAAC;EACxBC,eAAe,GAAW,CAAC,GAAG,KAAK,CAAC,CAAC;EACrCC,YAAY,GAAW,KAAK;EAMpC,MAAaC,IAAIA,CACfC,KAA8B,EAC9BC,0BAAsD,EACtD;IACA,MAAMC,oBAAoB,GAAG,IAAI,CAACT,eAAe,CAACM,IAAI,CAACC,KAAK,CAAC;IAC7D,MAAMG,qBAAqB,GAAGZ,eAAe,CAACa,KAAK,CACjDH,0BAA0B,EAC1BD,KAAK,CAACK,aAAa,EACnBL,KAAK,CAACM,aACR,CAAC;IACD,MAAM,CA
ACC,CAAC,EAAEC,qBAAqB,CAAC,GAAG,MAAMC,OAAO,CAACC,GAAG,CAAC,CACnDR,oBAAoB,EACpBC,qBAAqB,CACtB,CAAC;IACF,MAAME,aAAa,GAAGG,qBAAqB,GAAG,CAAC,CAAC;IAChD,MAAMF,aAAa,GAAGE,qBAAqB,GAAG,CAAC,CAAC;IAChD,IAAI,CAACH,aAAa,IAAI,CAACC,aAAa,EAAE;MACpC,MAAM,IAAIK,KAAK,CAAC,uBAAuB,CAAC;IAC1C;IACA,IAAI,CAACC,YAAY,GAAG,MAAMC,MAAM,CAACC,gBAAgB,CAC/CT,aAAa,EACbC,aAAa,EACb,SACF,CAAC;IAED,IAAI,CAACS,sBAAsB,GAAG,MAAM,IAAI,CAACtB,eAAe,CAACuB,SAAS,CAChE,uBACF,CAAC;IACD,IAAI,CAACC,cAAc,GAAG,MAAM,IAAI,CAACxB,eAAe,CAACuB,SAAS,CAAC,eAAe,CAAC;IAC3E,IAAI,CAACE,mBAAmB,GAAG,MAAM,IAAI,CAACzB,eAAe,CAACuB,SAAS,CAAC,UAAU,CAAC;EAC7E;EAEA,MAAcG,kBAAkBA,CAC9BC,OAAwB,EACL;IACnB,MAAMC,eAAyB,GAAG,CAAC,IAAI,CAACN,sBAAsB,CAAC;IAC/D,IAAIK,OAAO,CAACE,QAAQ,EAAE;MACpB,MAAMC,aAAa,GAAG,MAAM,IAAI,CAAC9B,eAAe,CAACuB,SAAS,CACxD,KAAKI,OAAO,CAACE,QAAQ,IACvB,CAAC;MACD,MAAME,SAAS,GAAG,MAAM,IAAI,CAAC/B,eAAe,CAACuB,SAAS,CAAC,gBAAgB,CAAC;MACxEK,eAAe,CAACI,IAAI,CAACF,aAAa,CAAC;MACnCF,eAAe,CAACI,IAAI,CAACD,SAAS,CAAC;IACjC;IACAH,eAAe,CAACI,IAAI,CAAC,IAAI,CAACP,mBAAmB,CAAC;IAC9C,OAAOG,eAAe;EACxB;EAEA,MAAcK,QAAQA,CACpBC,KAAe,EACfC,WAAmB,EACnBR,OAAwB,EAIvB;IACD,MAAM,IAAI,CAACS,MAAM,CAAC,IAAIC,YAAY,CAACH,KAAK,CAAC,CAAC;IAC1C,MAAMN,eAAe,GAAG,MAAM,IAAI,CAACF,kBAAkB,CAACC,OAAO,CAAC;IAC9D,MAAMW,YAAY,GAAG,CAAC,GAAGV,eAAe,CAAC;IACzC,MAAMW,MAAgB,GAAG,EAAE;IAE3B,OAAOD,YAAY,CAACE,MAAM,IAAI,IAAI,CAACtC,eAAe,EAAE;MAClD,MAAMuC,MAAM,GAAG,IAAI,CAACC,sBAAsB,CACxCC,KAAK,CAACC,IAAI,CAAC,MAAM,IAAI,CAACC,MAAM,CAACP,YAAY,CAAC,CAAC,EAC3CH,WAAW,KAAK,CAAC,GAAG,CAAC,GAAGA,WAC1B,CAAC;MACD,MAAMW,WAAW,GACfX,WAAW,KAAK,CAAC,GACbM,MAAM,CAACM,OAAO,CAACC,IAAI,CAACC,GAAG,CAAC,GAAGR,MAAM,CAAC,CAAC,GACnC,IAAI,CAACS,sBAAsB,CAACT,MAAM,CAAC;MACzC,MAAMU,aAAa,GAAGV,MAAM,CAACK,WAAW,CAAE;MAC1CR,YAAY,CAACN,IAAI,CAACc,WAAW,CAAC;MAC9BP,MAAM,CAACP,IAAI,CAACmB,aAAa,CAAC;MAC1B,IAAIL,WAAW,KAAK,IAAI,CAACtB,cAAc,EAAE;QACvC;MACF;IACF;IAEA,OAAO;MACLc,YAAY,EAAEA,YAAY,CAACc,KAAK,CAACxB,eAAe,CAACY,MAAM,CAAC;MACxDD,MAAM,EAAEA,MAAM,CAACa,KAAK,CAACxB,eAAe,CAACY,MAAM;IAC7C,CAAC;EACH;EAEQE,sBAA
sBA,CAACD,MAAgB,EAAEN,WAAW,GAAG,GAAG,EAAE;IAClE,MAAMc,GAAG,GAAGD,IAAI,CAACC,GAAG,CAAC,GAAGR,MAAM,CAAC;IAC/B,MAAMY,IAAI,GAAGZ,MAAM,CAACa,GAAG,CAAEC,KAAK,IAAKP,IAAI,CAACQ,GAAG,CAAC,CAACD,KAAK,GAAGN,GAAG,IAAId,WAAW,CAAC,CAAC;IACzE,MAAMsB,GAAG,GAAGJ,IAAI,CAACK,MAAM,CAAC,CAACC,CAAC,EAAEC,CAAC,KAAKD,CAAC,GAAGC,CAAC,EAAE,CAAC,CAAC;IAC3C,OAAOP,IAAI,CAACC,GAAG,CAAEE,GAAG,IAAKA,GAAG,GAAGC,GAAG,CAAC;EACrC;EAEQP,sBAAsBA,CAACW,KAAe,EAAU;IACtD,MAAMC,CAAC,GAAGd,IAAI,CAACe,MAAM,CAAC,CAAC;IACvB,IAAIC,UAAU,GAAG,CAAC;IAClB,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGJ,KAAK,CAACrB,MAAM,EAAEyB,CAAC,EAAE,EAAE;MACrCD,UAAU,IAAIH,KAAK,CAACI,CAAC,CAAE;MACvB,IAAIH,CAAC,GAAGE,UAAU,EAAE;QAClB,OAAOC,CAAC;MACV;IACF;IACA,OAAOJ,KAAK,CAACrB,MAAM,GAAG,CAAC;EACzB;EAEA,MAAc0B,oBAAoBA,CAChChC,KAAe,EACfP,OAAwB,EACxB;IACA,MAAMwC,YAAY,GAAG,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC;IACnD,IAAIC,eAAyB,GAAG,EAAE;IAElC,KAAK,MAAMjC,WAAW,IAAIgC,YAAY,EAAE;MACtC,MAAME,MAAM,GAAG,MAAM,IAAI,CAACpC,QAAQ,CAACC,KAAK,EAAEC,WAAW,EAAER,OAAO,CAAC;MAC/D,MAAM2C,MAAM,GAAGD,MAAM,CAAC/B,YAAY;MAClC,MAAMC,MAAM,GAAG8B,MAAM,CAAC9B,MAAM;MAE5B,MAAMgC,MAAM,GAAGD,MAAM,CAAC9B,MAAM;MAC5B,MAAMgC,UAAU,GAAGjC,MAAM,CAACmB,MAAM,CAC9B,CAACe,GAAG,EAAEC,KAAK,KAAKD,GAAG,GAAGzB,IAAI,CAAC2B,GAAG,CAACD,KAAK,CAAC,EACrC,CACF,CAAC;MACD,MAAME,UAAU,GAAGJ,UAAU,GAAGD,MAAM;MAEtC,IAAIK,UAAU,IAAI,CAAC,GAAG,EAAE;QACtBR,eAAe,GAAGE,MAAM;QACxB;MACF;IACF;IAEA,OAAO,IAAI,CAACO,4BAA4B,CAACT,eAAe,EAAElC,KAAK,CAAC;EAClE;EAEA,MAAc2C,4BAA4BA,CACxCT,eAAyB,EACzBlC,KAAe,EACK;IACpB,MAAM4C,QAAmB,GAAG,EAAE;IAE9B,IAAIR,MAAgB,GAAG,EAAE;IACzB,IAAIS,aAAa,GAAG,IAAI,CAACtD,mBAAmB;IAC5C,KAAK,IAAIwC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGG,eAAe,CAAC5B,MAAM,EAAEyB,CAAC,EAAE,EAAE;MAC/C,IAAIG,eAAe,CAACH,CAAC,CAAC,GAAI,IAAI,CAACxC,mBAAmB,EAAE;QAClD6C,MAAM,CAACtC,IAAI,CAACoC,eAAe,CAACH,CAAC,CAAE,CAAC;MAClC;MAEA,IACEA,CAAC,GAAG,CAAC,IACLG,eAAe,CAACH,CAAC,GAAG,CAAC,CAAC,IAAK,IAAI,CAACxC,mBAAmB,IACnD2C,eAAe,CAACH,CAAC,CAAC,IAAK,IAAI,CAACxC,mBAAmB,EAC/C;QACA,MAAMuD,KAAK,GAAGD,aAAa;QAC
3B,MAAME,GAAG,GAAGb,eAAe,CAACH,CAAC,GAAG,CAAC,CAAE;QACnC,MAAMiB,WAAW,GAAG,MAAM,IAAI,CAACC,4BAA4B,CACzDb,MAAM,EACNU,KAAK,EACLC,GACF,CAAC;QACDH,QAAQ,CAAC9C,IAAI,CAAC;UACZoD,KAAK,EAAEF;QACT,CAAC,CAAC;QACFZ,MAAM,GAAG,EAAE;QACXS,aAAa,GAAGX,eAAe,CAACH,CAAC,CAAE;MACrC;IACF;IAEA,MAAMe,KAAK,GAAGD,aAAa;IAC3B,MAAME,GAAG,GAAGb,eAAe,CAACiB,EAAE,CAAC,CAAC,CAAC,CAAE;IACnC,MAAMH,WAAW,GAAG,MAAM,IAAI,CAACC,4BAA4B,CACzDb,MAAM,EACNU,KAAK,EACLC,GACF,CAAC;IACDH,QAAQ,CAAC9C,IAAI,CAAC;MACZoD,KAAK,EAAEF;IACT,CAAC,CAAC;IAEF,MAAMI,aAAa,GACjBpD,KAAK,CAACM,MAAM,GACZ,IAAI,CAACnC,YAAY,IAChB,CAAC4E,GAAG,GAAG,IAAI,CAACxD,mBAAmB,IAAI,IAAI,CAACxB,aAAa,CAAC;IACzD,IAAIqF,aAAa,GAAG,CAAC,EAAE;MACrB,KAAK,MAAMC,OAAO,IAAIT,QAAQ,EAAE;QAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;UAChCI,IAAI,CAACR,KAAK,IAAIM,aAAa;UAC3BE,IAAI,CAACP,GAAG,IAAIK,aAAa;QAC3B;MACF;IACF;IAEA,OAAOR,QAAQ;EACjB;EAEA,MAAcK,4BAA4BA,CACxCb,MAAgB,EAChBU,KAAa,EACbC,GAAW,EACY;IACvB,MAAMQ,QAAQ,GAAG,CAACR,GAAG,GAAGD,KAAK,IAAI,IAAI,CAAC/E,aAAa;IACnD,MAAMyF,WAAW,GAAG,CACjB,MAAM,IAAI,CAAC1F,eAAe,CAAC6C,MAAM,CAACyB,MAAM,CAAC,EAC1CqB,IAAI,CAAC,CAAC;IAER,MAAMP,KAAK,GAAGM,WAAW,CAACE,KAAK,CAAC,GAAG,CAAC,CAACtC,GAAG,CAAEuC,CAAC,IAAK,IAAIA,CAAC,EAAE,CAAC;IACxD,MAAMC,eAAe,GAAGV,KAAK,CAAC1B,MAAM,CAClC,CAACe,GAAW,EAAEe,IAAY,KAAKf,GAAG,GAAGe,IAAI,CAAChD,MAAM,EAChD,CACF,CAAC;IAED,MAAMuD,gBAAgB,GAAGN,QAAQ,GAAGK,eAAe;IAEnD,MAAMZ,WAAyB,GAAG,EAAE;IACpC,MAAMc,eAAe,GACnB,CAAChB,KAAK,GAAG,IAAI,CAACvD,mBAAmB,IAAI,IAAI,CAACxB,aAAa;IAEzD,IAAIgG,WAAW,GAAG,CAAC;IACnB,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGd,KAAK,CAAC5C,MAAM,EAAE0D,CAAC,EAAE,EAAE;MACrC,MAAMV,IAAI,GAAGJ,KAAK,CAACc,CAAC,CAAE;MACtB,MAAMlB,KAAK,GAAGgB,eAAe,GAAGC,WAAW,GAAGF,gBAAgB;MAC9D,MAAMd,GAAG,GAAGD,KAAK,GAAGe,gBAAgB,GAAGP,IAAI,CAAChD,MAAM;MAClD0C,WAAW,CAAClD,IAAI,CAAC;QAAEwD,IAAI;QAAER,KAAK;QAAEC;MAAI,CAAC,CAAC;MACtCgB,WAAW,IAAIT,IAAI,CAAChD,MAAM;IAC5B;IAEA,OAAO0C,WAAW;EACpB;EAEA,MAAaiB,UAAUA,CACrBjE,KAAe,EACfP,OAAwB,EACJ;IACpB,IAAIyE,IAAI,GAAG,CAAC;IACZ,MAAMC,WAAsB,GAAG,EAAE;IAEjC,OAAOD,IAAI,GAAG,IA
AI,CAAC/F,YAAY,GAAG6B,KAAK,CAACM,MAAM,EAAE;MAC9C,MAAM8D,KAAK,GAAGpE,KAAK,CAACkB,KAAK,CACvBgD,IAAI,GAAG,IAAI,CAAC/F,YAAY,EACxB,CAAC+F,IAAI,GAAG,IAAI,CAACjG,SAAS,IAAI,IAAI,CAACE,YACjC,CAAC;MACD,IAAIiG,KAAK,CAAC9D,MAAM,GAAG,IAAI,CAACpC,eAAe,EAAE;QACvC,OAAOiG,WAAW;MACpB;MACA,MAAMvB,QAAQ,GAAG,MAAM,IAAI,CAACZ,oBAAoB,CAACoC,KAAK,EAAE3E,OAAO,CAAC;MAChE,KAAK,MAAM4D,OAAO,IAAIT,QAAQ,EAAE;QAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;UAChCI,IAAI,CAACR,KAAK,IAAIoB,IAAI;UAClBZ,IAAI,CAACP,GAAG,IAAImB,IAAI;QAClB;MACF;MACAC,WAAW,CAACrE,IAAI,CAAC,GAAG8C,QAAQ,CAAC;MAC7B,MAAMyB,aAAa,GAAGzB,QAAQ,CAACO,EAAE,CAAC,CAAC,CAAC,CAAC,CAAED,KAAK,CAACC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAEJ,GAAG;MACxDmB,IAAI,GAAGG,aAAa;IACtB;IAEA,OAAOF,WAAW;EACpB;EAEOG,OAAOA,CAAC1B,QAAmB,EAAe;IAC/C,MAAM2B,CAAc,GAAG,EAAE;IACzB,KAAK,MAAMlB,OAAO,IAAIT,QAAQ,EAAE;MAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;QAChCqB,CAAC,CAACzE,IAAI,CAAC,CAACwD,IAAI,CAACR,KAAK,EAAEQ,IAAI,CAACP,GAAG,EAAEO,IAAI,CAACA,IAAI,CAAC,CAAC;MAC3C;IACF;IACA,OAAOiB,CAAC;EACV;EAEOC,aAAaA,CAACC,GAAc,EAAE;IACnC,OAAOA,GAAG,CAACrD,GAAG,CAAEiC,OAAO,IAAKA,OAAO,CAACH,KAAK,CAACC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAEJ,GAAG,CAAC;EACxD;EAEA,MAAa7C,MAAMA,CAACwE,QAAsB,EAAiB;IACzD,MAAM,IAAI,CAACzF,YAAY,CAACiB,MAAM,CAACwE,QAAQ,CAAC;EAC1C;EAEA,MAAa/D,MAAMA,CAACyB,MAAgB,EAAyB;IAC3D,OAAO,IAAIjC,YAAY,CAAC,MAAM,IAAI,CAAClB,YAAY,CAAC0B,MAAM,CAACyB,MAAM,CAAC,CAAC;EACjE;AACF","ignoreList":[]}
@@ -0,0 +1,73 @@
1
+ "use strict";
2
+
3
+ // NOTE: This will be implemented in C++
4
+
5
+ import { HypothesisBuffer } from './hypothesisBuffer';
6
/**
 * Incremental (streaming) front end for an ASR instance.
 *
 * Audio is accumulated in `audioBuffer`; every processIter() call
 * re-transcribes the whole buffer, lets the HypothesisBuffer decide which
 * words are committed, and trims the audio once more than 15 seconds are
 * buffered.
 *
 * NOTE: This will be implemented in C++
 */
export class OnlineASRProcessor {
  // ASR instance supplied to the constructor.
  asr;
  samplingRate = 16000;
  audioBuffer = [];
  transcriptBuffer = new HypothesisBuffer();
  // Added to the times reported by the ASR; advanced by chunkAt() and finish().
  bufferTimeOffset = 0;
  committed = [];

  constructor(asr) {
    this.asr = asr;
  }

  /**
   * Appends samples to the audio buffer.
   *
   * Samples are pushed one by one: `push(...audio)` passes every sample as a
   * call argument and throws a RangeError once a chunk exceeds the engine's
   * argument limit.
   */
  insertAudioChunk(audio) {
    for (const sample of audio) {
      this.audioBuffer.push(sample);
    }
  }

  /**
   * Transcribes the buffered audio and updates the hypothesis buffer.
   *
   * @returns {Promise<{committed: string, nonCommitted: string}>} Text
   *   committed by this iteration and the text still pending.
   */
  async processIter(options) {
    const res = await this.asr.transcribe(this.audioBuffer, options);
    const tsw = this.asr.tsWords(res);
    this.transcriptBuffer.insert(tsw, this.bufferTimeOffset);
    const o = this.transcriptBuffer.flush();
    this.committed.push(...o);

    const maxBufferedSeconds = 15;
    if (this.audioBuffer.length / this.samplingRate > maxBufferedSeconds) {
      this.chunkCompletedSegment(res);
    }

    // NOTE(review): committed text is joined with ' ' (see toFlush) while the
    // pending text is joined with ''; left unchanged — confirm which one
    // callers expect.
    const committed = this.toFlush(o)[2];
    const nonCommitted = this.transcriptBuffer
      .complete()
      .map(x => x[2])
      .join('');
    return {
      committed,
      nonCommitted,
    };
  }

  /**
   * Cuts the buffers at the end of the latest segment (the final segment is
   * never used) that finishes at or before the last committed word; does
   * nothing when no such segment exists.
   */
  chunkCompletedSegment(res) {
    if (this.committed.length === 0) {
      return;
    }
    const ends = this.asr.segmentsEndTs(res);
    const t = this.committed[this.committed.length - 1][1];
    if (ends.length > 1) {
      let e = ends[ends.length - 2] + this.bufferTimeOffset;
      while (ends.length > 2 && e > t) {
        ends.pop();
        e = ends[ends.length - 2] + this.bufferTimeOffset;
      }
      if (e <= t) {
        this.chunkAt(e);
      }
    }
  }

  /**
   * Drops committed words and audio samples that lie before `time` and makes
   * `time` the new buffer offset.
   */
  chunkAt(time) {
    this.transcriptBuffer.popCommitted(time);
    const cutSeconds = time - this.bufferTimeOffset;
    this.audioBuffer = this.audioBuffer.slice(Math.floor(cutSeconds * this.samplingRate));
    this.bufferTimeOffset = time;
  }

  /**
   * Returns the still-pending text as committed and advances the buffer
   * offset by the duration of the buffered audio.
   */
  async finish() {
    const o = this.transcriptBuffer.complete();
    const f = this.toFlush(o);
    this.bufferTimeOffset += this.audioBuffer.length / this.samplingRate;
    return {
      committed: f[2],
    };
  }

  /**
   * Collapses [start, end, text] tuples into
   * [firstStart | null, lastEnd | null, texts joined by ' '].
   */
  toFlush(words) {
    const t = words.map(s => s[2]).join(' ');
    const b = words.length === 0 ? null : words[0][0];
    const e = words.length === 0 ? null : words[words.length - 1][1];
    return [b, e, t];
  }
}
73
+ //# sourceMappingURL=OnlineProcessor.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"names":["HypothesisBuffer","OnlineASRProcessor","samplingRate","audioBuffer","transcriptBuffer","bufferTimeOffset","committed","constructor","asr","insertAudioChunk","audio","push","processIter","options","res","transcribe","tsw","tsWords","insert","o","flush","s","length","chunkCompletedSegment","toFlush","nonCommitted","complete","map","x","join","ends","segmentsEndTs","t","at","e","pop","chunkAt","time","popCommitted","cutSeconds","slice","Math","floor","finish","f","words","b"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/OnlineProcessor.ts"],"mappings":";;AAAA;;AAIA,SAASA,gBAAgB,QAAQ,oBAAoB;AAErD,OAAO,MAAMC,kBAAkB,CAAC;EAGtBC,YAAY,GAAW,KAAK;EAC7BC,WAAW,GAAa,EAAE;EACzBC,gBAAgB,GAAqB,IAAIJ,gBAAgB,CAAC,CAAC;EAC3DK,gBAAgB,GAAW,CAAC;EAC5BC,SAAS,GAAgB,EAAE;EAEnCC,WAAWA,CAACC,GAAQ,EAAE;IACpB,IAAI,CAACA,GAAG,GAAGA,GAAG;EAChB;EAEOC,gBAAgBA,CAACC,KAAe,EAAE;IACvC,IAAI,CAACP,WAAW,CAACQ,IAAI,CAAC,GAAGD,KAAK,CAAC;EACjC;EAEA,MAAaE,WAAWA,CAACC,OAAwB,EAAE;IACjD,MAAMC,GAAG,GAAG,MAAM,IAAI,CAACN,GAAG,CAACO,UAAU,CAAC,IAAI,CAACZ,WAAW,EAAEU,OAAO,CAAC;IAChE,MAAMG,GAAG,GAAG,IAAI,CAACR,GAAG,CAACS,OAAO,CAACH,GAAG,CAAC;IACjC,IAAI,CAACV,gBAAgB,CAACc,MAAM,CAACF,GAAG,EAAE,IAAI,CAACX,gBAAgB,CAAC;IACxD,MAAMc,CAAC,GAAG,IAAI,CAACf,gBAAgB,CAACgB,KAAK,CAAC,CAAC;IACvC,IAAI,CAACd,SAAS,CAACK,IAAI,CAAC,GAAGQ,CAAC,CAAC;IAEzB,MAAME,CAAC,GAAG,EAAE;IACZ,IAAI,IAAI,CAAClB,WAAW,CAACmB,MAAM,GAAG,IAAI,CAACpB,YAAY,GAAGmB,CAAC,EAAE;MACnD,IAAI,CAACE,qBAAqB,CAACT,GAAG,CAAC;IACjC;IAEA,MAAMR,SAAS,GAAG,IAAI,CAACkB,OAAO,CAACL,CAAC,CAAC,CAAC,CAAC,CAAC;IACpC,MAAMM,YAAY,GAAG,IAAI,CAACrB,gBAAgB,CACvCsB,QAAQ,CAAC,CAAC,CACVC,GAAG,CAAEC,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,EAAE,CAAC;IACX,OAAO;MAAEvB,SAAS;MAAEmB;IAAa,CAAC;EACpC;EAEQF,qBAAqBA,CAACT,GAAc,EAAE;IAC5C,IAAI,IAAI,CAACR,SAAS,CAACgB,MAAM,KAAK,CAAC,EAAE;MAC/B;IACF;IAEA,MAAMQ,IAAI,GAAG,IAAI,CAACtB,GAAG,CAACuB,aAAa,CAACjB,GAAG,CAAC;IACxC,MAAMkB,CAAC,GAAG,IAAI,CAAC1B,SAAS,CAAC2B,EAAE,CAAC,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC
;IAEnC,IAAIH,IAAI,CAACR,MAAM,GAAG,CAAC,EAAE;MACnB,IAAIY,CAAC,GAAGJ,IAAI,CAACG,EAAE,CAAC,CAAC,CAAC,CAAC,GAAI,IAAI,CAAC5B,gBAAgB;MAC5C,OAAOyB,IAAI,CAACR,MAAM,GAAG,CAAC,IAAIY,CAAC,GAAGF,CAAC,EAAE;QAC/BF,IAAI,CAACK,GAAG,CAAC,CAAC;QACVD,CAAC,GAAGJ,IAAI,CAACG,EAAE,CAAC,CAAC,CAAC,CAAC,GAAI,IAAI,CAAC5B,gBAAgB;MAC1C;MAEA,IAAI6B,CAAC,IAAIF,CAAC,EAAE;QACV,IAAI,CAACI,OAAO,CAACF,CAAC,CAAC;MACjB;IACF;EACF;EAEQE,OAAOA,CAACC,IAAY,EAAE;IAC5B,IAAI,CAACjC,gBAAgB,CAACkC,YAAY,CAACD,IAAI,CAAC;IACxC,MAAME,UAAU,GAAGF,IAAI,GAAG,IAAI,CAAChC,gBAAgB;IAC/C,IAAI,CAACF,WAAW,GAAG,IAAI,CAACA,WAAW,CAACqC,KAAK,CACvCC,IAAI,CAACC,KAAK,CAACH,UAAU,GAAG,IAAI,CAACrC,YAAY,CAC3C,CAAC;IACD,IAAI,CAACG,gBAAgB,GAAGgC,IAAI;EAC9B;EAEA,MAAaM,MAAMA,CAAA,EAAG;IACpB,MAAMxB,CAAC,GAAG,IAAI,CAACf,gBAAgB,CAACsB,QAAQ,CAAC,CAAC;IAC1C,MAAMkB,CAAC,GAAG,IAAI,CAACpB,OAAO,CAACL,CAAC,CAAC;IACzB,IAAI,CAACd,gBAAgB,IAAI,IAAI,CAACF,WAAW,CAACmB,MAAM,GAAG,IAAI,CAACpB,YAAY;IACpE,OAAO;MAAEI,SAAS,EAAEsC,CAAC,CAAC,CAAC;IAAE,CAAC;EAC5B;EAEQpB,OAAOA,CAACqB,KAAkB,EAA0C;IAC1E,MAAMb,CAAC,GAAGa,KAAK,CAAClB,GAAG,CAAEN,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAACQ,IAAI,CAAC,GAAG,CAAC;IAC1C,MAAMiB,CAAC,GAAGD,KAAK,CAACvB,MAAM,KAAK,CAAC,GAAG,IAAI,GAAGuB,KAAK,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;IAClD,MAAMX,CAAC,GAAGW,KAAK,CAACvB,MAAM,KAAK,CAAC,GAAG,IAAI,GAAGuB,KAAK,CAACZ,EAAE,CAAC,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;IACtD,OAAO,CAACa,CAAC,EAAEZ,CAAC,EAAEF,CAAC,CAAC;EAClB;AACF","ignoreList":[]}
@@ -0,0 +1,56 @@
1
+ "use strict";
2
+
3
+ // NOTE: This will be implemented in C++
4
+
5
/**
 * Buffer that reconciles successive transcription hypotheses.
 *
 * Every word is a triple whose first two entries are numeric timestamps
 * (the insertion offset is added to both) and whose third entry is the word
 * text. A word is committed by `flush()` when the freshly inserted hypothesis
 * and the remainder of the previous one agree on its text at the same
 * position.
 */
export class HypothesisBuffer {
  // Committed words that popCommitted() has not dropped yet.
  committedInBuffer = [];
  // Uncommitted remainder of the previous hypothesis.
  buffer = [];
  // Most recently inserted hypothesis, consumed by the next flush().
  new = [];
  // Second timestamp of the most recently committed word.
  lastCommittedTime = 0;
  // Text of the most recently committed word; null before the first commit.
  lastCommittedWord = null;

  /**
   * Stores a new hypothesis.
   *
   * Timestamps are shifted by `offset`, words starting at or before
   * `lastCommittedTime - 0.5` are discarded, and - when the hypothesis starts
   * within one unit of the last committed time - a leading run of up to five
   * words that repeats the tail of the committed words is removed.
   */
  insert(newWords, offset) {
    const shifted = newWords.map(([start, end, text]) => [
      start + offset,
      end + offset,
      text,
    ]);
    this.new = shifted.filter(
      ([start]) => start > this.lastCommittedTime - 0.5
    );

    if (this.new.length === 0) {
      return;
    }

    const [firstStart] = this.new[0];
    const startsNearLastCommit =
      Math.abs(firstStart - this.lastCommittedTime) < 1;
    if (!startsNearLastCommit || this.committedInBuffer.length === 0) {
      return;
    }

    const textOf = (word) => word[2];
    const longestOverlap = Math.min(
      this.committedInBuffer.length,
      this.new.length,
      5
    );
    for (let size = 1; size <= longestOverlap; size++) {
      const committedTail = this.committedInBuffer
        .slice(-size)
        .map(textOf)
        .join(' ');
      const incomingHead = this.new.slice(0, size).map(textOf).join(' ');
      if (committedTail === incomingHead) {
        // The hypothesis repeats already-committed words; drop the repeat.
        this.new.splice(0, size);
        break;
      }
    }
  }

  /**
   * Commits the longest leading run of words on which the new hypothesis and
   * the previous buffer agree, and returns that run.
   *
   * Afterwards the unmatched rest of the new hypothesis becomes the buffer
   * and the new-hypothesis slot is emptied.
   */
  flush() {
    const comparable = Math.min(this.new.length, this.buffer.length);
    let agreed = 0;
    while (
      agreed < comparable &&
      this.new[agreed][2] === this.buffer[agreed][2]
    ) {
      agreed++;
    }

    // Remove the agreed prefix from both arrays in place.
    const commit = this.new.splice(0, agreed);
    this.buffer.splice(0, agreed);

    if (agreed > 0) {
      const lastWord = commit[agreed - 1];
      this.lastCommittedWord = lastWord[2];
      this.lastCommittedTime = lastWord[1];
    }

    this.buffer = this.new;
    this.new = [];
    this.committedInBuffer.push(...commit);
    return commit;
  }

  /** Forgets committed words whose second timestamp is not after `time`. */
  popCommitted(time) {
    this.committedInBuffer = this.committedInBuffer.filter(
      ([, end]) => end > time
    );
  }

  /** Returns the current uncommitted buffer (the internal array itself). */
  complete() {
    return this.buffer;
  }
}
56
+ //# sourceMappingURL=hypothesisBuffer.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"names":["HypothesisBuffer","committedInBuffer","buffer","new","lastCommittedTime","lastCommittedWord","insert","newWords","offset","newWordsOffset","map","a","b","t","filter","_b","_t","length","Math","abs","cn","nn","i","min","c","slice","w","join","tail","j","shift","flush","commit","push","popCommitted","time","_a","complete"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/hypothesisBuffer.ts"],"mappings":";;AAAA;;AAIA,OAAO,MAAMA,gBAAgB,CAAC;EACpBC,iBAAiB,GAAgB,EAAE;EACnCC,MAAM,GAAgB,EAAE;EACxBC,GAAG,GAAgB,EAAE;EAErBC,iBAAiB,GAAW,CAAC;EAC9BC,iBAAiB,GAAkB,IAAI;EAEvCC,MAAMA,CAACC,QAAqB,EAAEC,MAAc,EAAE;IACnD,MAAMC,cAA2B,GAAGF,QAAQ,CAACG,GAAG,CAAC,CAAC,CAACC,CAAC,EAAEC,CAAC,EAAEC,CAAC,CAAC,KAAK,CAC9DF,CAAC,GAAGH,MAAM,EACVI,CAAC,GAAGJ,MAAM,EACVK,CAAC,CACF,CAAC;IACF,IAAI,CAACV,GAAG,GAAGM,cAAc,CAACK,MAAM,CAC9B,CAAC,CAACH,CAAC,EAAEI,EAAE,EAAEC,EAAE,CAAC,KAAKL,CAAC,GAAG,IAAI,CAACP,iBAAiB,GAAG,GAChD,CAAC;IAED,IAAI,IAAI,CAACD,GAAG,CAACc,MAAM,GAAG,CAAC,EAAE;MACvB,MAAM,CAACN,CAAC,EAAEI,EAAE,EAAEC,EAAE,CAAC,GAAG,IAAI,CAACb,GAAG,CAAC,CAAC,CAAE;MAChC,IACEe,IAAI,CAACC,GAAG,CAACR,CAAC,GAAG,IAAI,CAACP,iBAAiB,CAAC,GAAG,CAAC,IACxC,IAAI,CAACH,iBAAiB,CAACgB,MAAM,GAAG,CAAC,EACjC;QACA,MAAMG,EAAE,GAAG,IAAI,CAACnB,iBAAiB,CAACgB,MAAM;QACxC,MAAMI,EAAE,GAAG,IAAI,CAAClB,GAAG,CAACc,MAAM;QAE1B,KAAK,IAAIK,CAAC,GAAG,CAAC,EAAEA,CAAC,IAAIJ,IAAI,CAACK,GAAG,CAACH,EAAE,EAAEC,EAAE,EAAE,CAAC,CAAC,EAAEC,CAAC,EAAE,EAAE;UAC7C,MAAME,CAAC,GAAG,IAAI,CAACvB,iBAAiB,CAC7BwB,KAAK,CAAC,CAACH,CAAC,CAAC,CACTZ,GAAG,CAAEgB,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,GAAG,CAAC;UACZ,MAAMC,IAAI,GAAG,IAAI,CAACzB,GAAG,CAClBsB,KAAK,CAAC,CAAC,EAAEH,CAAC,CAAC,CACXZ,GAAG,CAAEgB,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,GAAG,CAAC;UACZ,IAAIH,CAAC,KAAKI,IAAI,EAAE;YACd,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGP,CAAC,EAAEO,CAAC,EAAE,EAAE;cAC1B,IAAI,CAAC1B,GAAG,CAAC2B,KAAK,CAAC,CAAC;YAClB;YACA;UACF;QACF;MACF;IACF;EACF;EAEOC,KAAKA,CAAA,EAAgB;IAC1B,MAAMC,MAAmB,GAAG,EAAE;IAC9B,OAA
O,IAAI,CAAC7B,GAAG,CAACc,MAAM,GAAG,CAAC,IAAI,IAAI,CAACf,MAAM,CAACe,MAAM,GAAG,CAAC,EAAE;MACpD,IAAI,IAAI,CAACd,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC,KAAK,IAAI,CAACD,MAAM,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC,EAAE;QAC1C;MACF;MACA8B,MAAM,CAACC,IAAI,CAAC,IAAI,CAAC9B,GAAG,CAAC,CAAC,CAAE,CAAC;MACzB,IAAI,CAACE,iBAAiB,GAAG,IAAI,CAACF,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;MACxC,IAAI,CAACC,iBAAiB,GAAG,IAAI,CAACD,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;MACxC,IAAI,CAACD,MAAM,CAAC4B,KAAK,CAAC,CAAC;MACnB,IAAI,CAAC3B,GAAG,CAAC2B,KAAK,CAAC,CAAC;IAClB;IACA,IAAI,CAAC5B,MAAM,GAAG,IAAI,CAACC,GAAG;IACtB,IAAI,CAACA,GAAG,GAAG,EAAE;IACb,IAAI,CAACF,iBAAiB,CAACgC,IAAI,CAAC,GAAGD,MAAM,CAAC;IACtC,OAAOA,MAAM;EACf;EAEOE,YAAYA,CAACC,IAAY,EAAE;IAChC,IAAI,CAAClC,iBAAiB,GAAG,IAAI,CAACA,iBAAiB,CAACa,MAAM,CACpD,CAAC,CAACsB,EAAE,EAAExB,CAAC,EAAEI,EAAE,CAAC,KAAKJ,CAAC,GAAGuB,IACvB,CAAC;EACH;EAEOE,QAAQA,CAAA,EAAgB;IAC7B,OAAO,IAAI,CAACnC,MAAM;EACpB;AACF","ignoreList":[]}
@@ -0,0 +1,8 @@
1
+ import { ResourceSource } from '../types/common';
2
/**
 * Static base class for modules that delegate to a native module.
 */
export declare class BaseModule {
  /** Native module that `load` forwards the fetched resource paths to. */
  protected static nativeModule: any;

  /** Progress callback handed to the resource fetcher while loading. */
  static onDownloadProgressCallback: (downloadProgress: number) => void;

  /**
   * Fetches `sources` and loads them into the native module.
   *
   * @param sources - Resources to fetch before loading.
   * @param loadArgs - Extra arguments that derived classes pass through to
   * the native load call.
   */
  static load(
    sources: Array<ResourceSource>,
    ...loadArgs: Array<any>
  ): Promise<void>;

  /** Inference entry point; derived classes are expected to implement it. */
  protected static forward(..._args: Array<any>): Promise<any>;

  /** Registers the callback used to report download progress. */
  static onDownloadProgress(
    callback: (downloadProgress: number) => void
  ): void;
}
@@ -0,0 +1,25 @@
1
+ import { ResourceFetcher } from '../utils/ResourceFetcher';
2
+ import { getError } from '../Error';
3
+ export class BaseModule {
4
+ static nativeModule;
5
+ static onDownloadProgressCallback = () => { };
6
+ static async load(sources, ...loadArgs // this can be used in derived classes to pass extra args to load method
7
+ ) {
8
+ try {
9
+ const paths = await ResourceFetcher.fetch(this.onDownloadProgressCallback, ...sources);
10
+ if (paths === null || paths.length < sources.length) {
11
+ throw new Error('Download interrupted.');
12
+ }
13
+ await this.nativeModule.loadModule(...paths, ...loadArgs);
14
+ }
15
+ catch (error) {
16
+ throw new Error(getError(error));
17
+ }
18
+ }
19
+ static async forward(..._args) {
20
+ throw new Error('forward method is not implemented in the BaseModule class. Please implement it in the derived class.');
21
+ }
22
+ static onDownloadProgress(callback) {
23
+ this.onDownloadProgressCallback = callback;
24
+ }
25
+ }
@@ -0,0 +1,9 @@
1
+ import { ResourceSource } from '../types/common';
2
+ import { TensorPtr } from '../types/common';
3
/**
 * Abstract base class for modules that hold their own native module instance.
 */
export declare abstract class BaseNonStaticModule {
  /** Native module instance backing this object. */
  nativeModule: any;

  /**
   * Loads the model; every concrete module provides its own implementation.
   *
   * @param modelSource - Resource describing the model to load.
   * @param onDownloadProgressCallback - Receives download progress updates.
   * @param args - Additional module-specific arguments.
   */
  abstract load(
    modelSource: ResourceSource,
    onDownloadProgressCallback: (_: number) => void,
    ...args: Array<any>
  ): Promise<void>;

  /** Forwards the input tensors to the native module's `forward`. */
  protected forwardET(inputTensor: Array<TensorPtr>): Promise<Array<TensorPtr>>;

  /** Queries the native module for the shape of one input of `methodName`. */
  getInputShape(methodName: string, index: number): Promise<Array<number>>;

  /** Unloads the native module if one is present. */
  delete(): void;
}
@@ -0,0 +1,14 @@
1
+ export class BaseNonStaticModule {
2
+ nativeModule = null;
3
+ async forwardET(inputTensor) {
4
+ return await this.nativeModule.forward(inputTensor);
5
+ }
6
+ async getInputShape(methodName, index) {
7
+ return this.nativeModule.getInputShape(methodName, index);
8
+ }
9
+ delete() {
10
+ if (this.nativeModule !== null) {
11
+ this.nativeModule.unload();
12
+ }
13
+ }
14
+ }
@@ -0,0 +1,8 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
3
/**
 * Image classification module.
 */
export declare class ClassificationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native classification module.
   *
   * @param model - Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: { modelSource: ResourceSource },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource - String identifying the image to classify.
   */
  forward(imageSource: string): Promise<any>;
}
@@ -0,0 +1,17 @@
1
+ import { ResourceFetcher } from '../../utils/ResourceFetcher';
2
+ import { ETError, getError } from '../../Error';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Image classification module backed by `global.loadClassification`.
 */
export class ClassificationModule extends BaseNonStaticModule {
  /**
   * Fetches `model.modelSource` and creates the native module from the first
   * fetched path (an empty string is passed when that path is falsy).
   *
   * Throws `Error('Download interrupted.')` when the fetch yields no paths.
   */
  async load(model, onDownloadProgressCallback = () => {}) {
    const fetched = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const interrupted = fetched === null || fetched.length < 1;
    if (interrupted) {
      throw new Error('Download interrupted.');
    }
    const modelPath = fetched[0] || '';
    this.nativeModule = global.loadClassification(modelPath);
  }

  /**
   * Passes `imageSource` to the native module's `generate` and returns its
   * result. Throws the `ModuleNotLoaded` error when no module is loaded.
   */
  async forward(imageSource) {
    const native = this.nativeModule;
    if (native === null || native === undefined) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const result = await native.generate(imageSource);
    return result;
  }
}
@@ -0,0 +1,8 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
3
/**
 * Image embeddings module.
 */
export declare class ImageEmbeddingsModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-embeddings module.
   *
   * @param model - Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: { modelSource: ResourceSource },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource - String identifying the image to embed.
   * @returns The model output as a `Float32Array`.
   */
  forward(imageSource: string): Promise<Float32Array>;
}
@@ -0,0 +1,17 @@
1
+ import { ResourceFetcher } from '../../utils/ResourceFetcher';
2
+ import { ETError, getError } from '../../Error';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Image embeddings module backed by `global.loadImageEmbeddings`.
 */
export class ImageEmbeddingsModule extends BaseNonStaticModule {
  /**
   * Fetches `model.modelSource` and creates the native module from the first
   * fetched path (an empty string is passed when that path is falsy).
   *
   * Throws `Error('Download interrupted.')` when the fetch yields no paths.
   */
  async load(model, onDownloadProgressCallback = () => {}) {
    const fetched = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const interrupted = fetched === null || fetched.length < 1;
    if (interrupted) {
      throw new Error('Download interrupted.');
    }
    const modelPath = fetched[0] || '';
    this.nativeModule = global.loadImageEmbeddings(modelPath);
  }

  /**
   * Passes `imageSource` to the native module's `generate` and wraps the
   * result in a `Float32Array`. Throws the `ModuleNotLoaded` error when no
   * module is loaded.
   */
  async forward(imageSource) {
    const native = this.nativeModule;
    if (native === null || native === undefined) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const embedding = await native.generate(imageSource);
    return new Float32Array(embedding);
  }
}
@@ -0,0 +1,11 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { DeeplabLabel } from '../../types/imageSegmentation';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Image segmentation module.
 */
export declare class ImageSegmentationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-segmentation module.
   *
   * @param model - Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: { modelSource: ResourceSource },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource - String identifying the image to segment.
   * @param classesOfInterest - Optional labels to request from the model.
   * @param resize - Optional flag forwarded to the native module.
   * @returns An object keyed by `DeeplabLabel` whose values are number arrays.
   */
  forward(
    imageSource: string,
    classesOfInterest?: Array<DeeplabLabel>,
    resize?: boolean
  ): Promise<Partial<Record<DeeplabLabel, Array<number>>>>;
}
@@ -0,0 +1,27 @@
1
+ import { ResourceFetcher } from '../../utils/ResourceFetcher';
2
+ import { DeeplabLabel } from '../../types/imageSegmentation';
3
+ import { ETError, getError } from '../../Error';
4
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
5
/**
 * Image segmentation module backed by `global.loadImageSegmentation`.
 */
export class ImageSegmentationModule extends BaseNonStaticModule {
  /**
   * Fetches `model.modelSource` and creates the native module from the first
   * fetched path (an empty string is passed when that path is falsy).
   *
   * Throws `Error('Download interrupted.')` when the fetch yields no paths.
   */
  async load(model, onDownloadProgressCallback = () => {}) {
    const fetched = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const interrupted = fetched === null || fetched.length < 1;
    if (interrupted) {
      throw new Error('Download interrupted.');
    }
    const modelPath = fetched[0] || '';
    this.nativeModule = global.loadImageSegmentation(modelPath);
  }

  /**
   * Runs segmentation on `imageSource`.
   *
   * Each entry of `classesOfInterest` (none when omitted) is looked up in
   * `DeeplabLabel` before being handed to the native module, and `resize`
   * falls back to `false`. Keys of the native result that exist in
   * `DeeplabLabel` are mapped back through `DeeplabLabel`; all other keys are
   * dropped. Throws the `ModuleNotLoaded` error when no module is loaded.
   */
  async forward(imageSource, classesOfInterest, resize) {
    const native = this.nativeModule;
    if (native === null || native === undefined) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }

    const requestedLabels = (classesOfInterest || []).map(
      (label) => DeeplabLabel[label]
    );
    const rawResult = await native.generate(
      imageSource,
      requestedLabels,
      resize || false
    );

    const resultByLabel = {};
    for (const name in rawResult) {
      if (!(name in DeeplabLabel)) {
        continue;
      }
      resultByLabel[DeeplabLabel[name]] = rawResult[name];
    }
    return resultByLabel;
  }
}
@@ -0,0 +1,15 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { OCRLanguage } from '../../types/ocr';
3
/**
 * OCR module; a thin wrapper around an internal controller.
 */
export declare class OCRModule {
  private controller;

  constructor();

  /**
   * Loads the detector and the three recognizers for the given language.
   *
   * @param model - Detector source, large/medium/small recognizer sources
   * and the OCR language.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: {
      detectorSource: ResourceSource;
      recognizerLarge: ResourceSource;
      recognizerMedium: ResourceSource;
      recognizerSmall: ResourceSource;
      language: OCRLanguage;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /** Passes `input` to the controller and resolves with its result. */
  forward(input: string): Promise<any>;

  /** Delegates to the controller's `delete`. */
  delete(): void;
}
@@ -0,0 +1,20 @@
1
+ import { OCRController } from '../../controllers/OCRController';
2
+ export class OCRModule {
3
+ controller;
4
+ constructor() {
5
+ this.controller = new OCRController();
6
+ }
7
+ async load(model, onDownloadProgressCallback = () => { }) {
8
+ await this.controller.load(model.detectorSource, {
9
+ recognizerLarge: model.recognizerLarge,
10
+ recognizerMedium: model.recognizerMedium,
11
+ recognizerSmall: model.recognizerSmall,
12
+ }, model.language, onDownloadProgressCallback);
13
+ }
14
+ async forward(input) {
15
+ return await this.controller.forward(input);
16
+ }
17
+ delete() {
18
+ this.controller.delete();
19
+ }
20
+ }
@@ -0,0 +1,9 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { Detection } from '../../types/objectDetection';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Object detection module.
 */
export declare class ObjectDetectionModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native object-detection module.
   *
   * @param model - Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: { modelSource: ResourceSource },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource - String identifying the image to analyze.
   * @param detectionThreshold - Optional threshold forwarded to the native
   * module.
   * @returns The detections reported by the native module.
   */
  forward(
    imageSource: string,
    detectionThreshold?: number
  ): Promise<Array<Detection>>;
}
@@ -0,0 +1,17 @@
1
+ import { ResourceFetcher } from '../../utils/ResourceFetcher';
2
+ import { ETError, getError } from '../../Error';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Object detection module backed by `global.loadObjectDetection`.
 */
export class ObjectDetectionModule extends BaseNonStaticModule {
  /**
   * Fetches `model.modelSource` and creates the native module from the first
   * fetched path (an empty string is passed when that path is falsy).
   *
   * Throws `Error('Download interrupted.')` when the fetch yields no paths.
   */
  async load(model, onDownloadProgressCallback = () => {}) {
    const fetched = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const interrupted = fetched === null || fetched.length < 1;
    if (interrupted) {
      throw new Error('Download interrupted.');
    }
    const modelPath = fetched[0] || '';
    this.nativeModule = global.loadObjectDetection(modelPath);
  }

  /**
   * Passes `imageSource` and `detectionThreshold` (0.7 when omitted) to the
   * native module's `generate` and returns its result. Throws the
   * `ModuleNotLoaded` error when no module is loaded.
   */
  async forward(imageSource, detectionThreshold = 0.7) {
    const native = this.nativeModule;
    if (native === null || native === undefined) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const detections = await native.generate(imageSource, detectionThreshold);
    return detections;
  }
}
@@ -0,0 +1,8 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
3
/**
 * Style transfer module.
 */
export declare class StyleTransferModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native style-transfer module.
   *
   * @param model - Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: { modelSource: ResourceSource },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource - String identifying the input image.
   * @returns The string produced by the native module.
   */
  forward(imageSource: string): Promise<string>;
}
@@ -0,0 +1,17 @@
1
+ import { ResourceFetcher } from '../../utils/ResourceFetcher';
2
+ import { ETError, getError } from '../../Error';
3
+ import { BaseNonStaticModule } from '../BaseNonStaticModule';
4
/**
 * Style transfer module backed by `global.loadStyleTransfer`.
 */
export class StyleTransferModule extends BaseNonStaticModule {
  /**
   * Fetches `model.modelSource` and creates the native module from the first
   * fetched path (an empty string is passed when that path is falsy).
   *
   * Throws `Error('Download interrupted.')` when the fetch yields no paths.
   */
  async load(model, onDownloadProgressCallback = () => {}) {
    const fetched = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const interrupted = fetched === null || fetched.length < 1;
    if (interrupted) {
      throw new Error('Download interrupted.');
    }
    const modelPath = fetched[0] || '';
    this.nativeModule = global.loadStyleTransfer(modelPath);
  }

  /**
   * Passes `imageSource` to the native module's `generate` and returns its
   * result. Throws the `ModuleNotLoaded` error when no module is loaded.
   */
  async forward(imageSource) {
    const native = this.nativeModule;
    if (native === null || native === undefined) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const stylized = await native.generate(imageSource);
    return stylized;
  }
}
@@ -0,0 +1,15 @@
1
+ import { ResourceSource } from '../../types/common';
2
+ import { OCRLanguage } from '../../types/ocr';
3
/**
 * Vertical OCR module.
 *
 * NOTE(review): only the declaration is visible here; the member descriptions
 * below restate the signatures and should be confirmed against the
 * implementation.
 */
export declare class VerticalOCRModule {
  private controller;

  constructor();

  /**
   * Loads the two detectors and two recognizers for the given language.
   *
   * @param model - Large/narrow detector sources, large/small recognizer
   * sources and the OCR language.
   * @param independentCharacters - Required flag; presumably selects
   * per-character recognition - TODO confirm.
   * @param onDownloadProgressCallback - Optional download progress listener.
   */
  load(
    model: {
      detectorLarge: ResourceSource;
      detectorNarrow: ResourceSource;
      recognizerLarge: ResourceSource;
      recognizerSmall: ResourceSource;
      language: OCRLanguage;
    },
    independentCharacters: boolean,
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /** Runs OCR on `input` and resolves with the result. */
  forward(input: string): Promise<any>;

  /** Releases the module's resources. */
  delete(): void;
}