react-native-executorch 0.5.1-rc.0 → 0.5.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +132 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +4 -10
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +1 -1
- package/common/rnexecutorch/models/speech_to_text/SpeechToTextStrategy.h +3 -2
- package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.cpp +16 -4
- package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.h +2 -2
- package/lib/Error.d.ts +30 -0
- package/lib/Error.js +50 -0
- package/lib/constants/directories.d.ts +1 -0
- package/lib/constants/directories.js +2 -0
- package/lib/constants/llmDefaults.d.ts +6 -0
- package/lib/constants/llmDefaults.js +16 -0
- package/lib/constants/modelUrls.d.ts +217 -83
- package/lib/constants/modelUrls.js +304 -98
- package/lib/constants/ocr/models.d.ts +882 -0
- package/lib/constants/ocr/models.js +182 -0
- package/lib/constants/ocr/symbols.d.ts +75 -0
- package/lib/constants/ocr/symbols.js +139 -0
- package/lib/{typescript/constants → constants}/sttDefaults.d.ts +0 -1
- package/lib/constants/sttDefaults.js +12 -10
- package/lib/controllers/LLMController.d.ts +47 -0
- package/lib/controllers/LLMController.js +14 -11
- package/lib/controllers/OCRController.d.ts +23 -0
- package/lib/controllers/OCRController.js +12 -5
- package/lib/controllers/SpeechToTextController.d.ts +8 -4
- package/lib/controllers/SpeechToTextController.js +15 -9
- package/lib/controllers/VerticalOCRController.d.ts +25 -0
- package/lib/controllers/VerticalOCRController.js +75 -0
- package/lib/hooks/computer_vision/useClassification.d.ts +15 -0
- package/lib/hooks/computer_vision/useClassification.js +7 -0
- package/lib/hooks/computer_vision/useImageEmbeddings.d.ts +15 -0
- package/lib/hooks/computer_vision/useImageEmbeddings.js +7 -0
- package/lib/hooks/computer_vision/useImageSegmentation.d.ts +38 -0
- package/lib/hooks/computer_vision/useImageSegmentation.js +7 -0
- package/lib/hooks/computer_vision/useOCR.d.ts +20 -0
- package/lib/hooks/computer_vision/useOCR.js +42 -0
- package/lib/hooks/computer_vision/useObjectDetection.d.ts +15 -0
- package/lib/hooks/computer_vision/useObjectDetection.js +7 -0
- package/lib/hooks/computer_vision/useStyleTransfer.d.ts +15 -0
- package/lib/hooks/computer_vision/useStyleTransfer.js +7 -0
- package/lib/hooks/computer_vision/useVerticalOCR.d.ts +21 -0
- package/lib/hooks/computer_vision/useVerticalOCR.js +45 -0
- package/lib/hooks/general/useExecutorchModule.d.ts +13 -0
- package/lib/hooks/general/useExecutorchModule.js +7 -0
- package/lib/hooks/natural_language_processing/useLLM.d.ts +10 -0
- package/lib/hooks/natural_language_processing/useLLM.js +78 -0
- package/lib/hooks/natural_language_processing/useSpeechToText.d.ts +27 -0
- package/lib/hooks/natural_language_processing/useSpeechToText.js +19 -14
- package/lib/hooks/natural_language_processing/useTextEmbeddings.d.ts +16 -0
- package/lib/hooks/natural_language_processing/useTextEmbeddings.js +7 -0
- package/lib/hooks/natural_language_processing/useTokenizer.d.ts +17 -0
- package/lib/hooks/natural_language_processing/useTokenizer.js +52 -0
- package/lib/hooks/useModule.d.ts +17 -0
- package/lib/hooks/useModule.js +45 -0
- package/lib/hooks/useNonStaticModule.d.ts +20 -0
- package/lib/hooks/useNonStaticModule.js +49 -0
- package/lib/index.d.ts +1 -1
- package/lib/index.js +3 -2
- package/lib/module/constants/modelUrls.js +61 -36
- package/lib/module/constants/modelUrls.js.map +1 -1
- package/lib/module/constants/ocr/models.js +1 -1
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js +71 -34
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
- package/lib/module/index.js +2 -3
- package/lib/module/index.js.map +1 -1
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +72 -31
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
- package/lib/module/types/stt.js +1 -85
- package/lib/module/types/stt.js.map +1 -1
- package/lib/module/utils/ResourceFetcher.js +6 -8
- package/lib/module/utils/ResourceFetcher.js.map +1 -1
- package/lib/module/utils/ResourceFetcherUtils.js +20 -20
- package/lib/module/utils/ResourceFetcherUtils.js.map +1 -1
- package/lib/module/utils/SpeechToTextModule/ASR.js +191 -0
- package/lib/module/utils/SpeechToTextModule/ASR.js.map +1 -0
- package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js +73 -0
- package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js.map +1 -0
- package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js +56 -0
- package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js.map +1 -0
- package/lib/modules/BaseModule.d.ts +8 -0
- package/lib/modules/BaseModule.js +25 -0
- package/lib/modules/BaseNonStaticModule.d.ts +9 -0
- package/lib/modules/BaseNonStaticModule.js +14 -0
- package/lib/modules/computer_vision/ClassificationModule.d.ts +8 -0
- package/lib/modules/computer_vision/ClassificationModule.js +17 -0
- package/lib/modules/computer_vision/ImageEmbeddingsModule.d.ts +8 -0
- package/lib/modules/computer_vision/ImageEmbeddingsModule.js +17 -0
- package/lib/modules/computer_vision/ImageSegmentationModule.d.ts +11 -0
- package/lib/modules/computer_vision/ImageSegmentationModule.js +27 -0
- package/lib/modules/computer_vision/OCRModule.d.ts +15 -0
- package/lib/modules/computer_vision/OCRModule.js +20 -0
- package/lib/modules/computer_vision/ObjectDetectionModule.d.ts +9 -0
- package/lib/modules/computer_vision/ObjectDetectionModule.js +17 -0
- package/lib/modules/computer_vision/StyleTransferModule.d.ts +8 -0
- package/lib/modules/computer_vision/StyleTransferModule.js +17 -0
- package/lib/modules/computer_vision/VerticalOCRModule.d.ts +15 -0
- package/lib/modules/computer_vision/VerticalOCRModule.js +22 -0
- package/lib/modules/general/ExecutorchModule.d.ts +7 -0
- package/lib/modules/general/ExecutorchModule.js +14 -0
- package/lib/modules/natural_language_processing/LLMModule.d.ts +28 -0
- package/lib/modules/natural_language_processing/LLMModule.js +45 -0
- package/lib/modules/natural_language_processing/SpeechToTextModule.d.ts +18 -8
- package/lib/modules/natural_language_processing/SpeechToTextModule.js +21 -15
- package/lib/modules/natural_language_processing/TextEmbeddingsModule.d.ts +9 -0
- package/lib/modules/natural_language_processing/TextEmbeddingsModule.js +21 -0
- package/lib/modules/natural_language_processing/TokenizerModule.d.ts +12 -0
- package/lib/modules/natural_language_processing/TokenizerModule.js +5 -4
- package/lib/native/NativeETInstaller.d.ts +6 -0
- package/lib/native/NativeETInstaller.js +2 -0
- package/lib/native/NativeOCR.d.ts +8 -0
- package/lib/native/NativeOCR.js +2 -0
- package/lib/native/NativeVerticalOCR.d.ts +8 -0
- package/lib/native/NativeVerticalOCR.js +2 -0
- package/lib/types/common.d.ts +31 -0
- package/lib/types/common.js +25 -0
- package/lib/types/imageSegmentation.d.ts +24 -0
- package/lib/types/imageSegmentation.js +26 -0
- package/lib/types/llm.d.ts +46 -0
- package/lib/types/llm.js +9 -0
- package/lib/types/objectDetection.d.ts +104 -0
- package/lib/types/objectDetection.js +94 -0
- package/lib/types/ocr.d.ts +11 -0
- package/lib/types/ocr.js +1 -0
- package/lib/types/stt.d.ts +94 -0
- package/lib/types/stt.js +85 -0
- package/lib/typescript/constants/modelUrls.d.ts +24 -7
- package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/models.d.ts +126 -126
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -24
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
- package/lib/typescript/index.d.ts +2 -3
- package/lib/typescript/index.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +19 -22
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
- package/lib/typescript/types/stt.d.ts +17 -91
- package/lib/typescript/types/stt.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -1
- package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts +27 -0
- package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts.map +1 -0
- package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts +23 -0
- package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts.map +1 -0
- package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts +13 -0
- package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts.map +1 -0
- package/lib/utils/ResourceFetcher.d.ts +24 -0
- package/lib/utils/ResourceFetcher.js +305 -0
- package/lib/utils/ResourceFetcherUtils.d.ts +54 -0
- package/lib/utils/ResourceFetcherUtils.js +9 -0
- package/lib/utils/llm.d.ts +6 -0
- package/lib/utils/llm.js +1 -0
- package/lib/utils/stt.d.ts +1 -0
- package/lib/utils/stt.js +21 -0
- package/package.json +5 -3
- package/src/constants/modelUrls.ts +70 -37
- package/src/constants/ocr/models.ts +1 -1
- package/src/hooks/natural_language_processing/useSpeechToText.ts +87 -92
- package/src/index.ts +6 -8
- package/src/modules/natural_language_processing/SpeechToTextModule.ts +81 -69
- package/src/types/stt.ts +97 -92
- package/src/utils/ResourceFetcher.ts +9 -7
- package/src/utils/ResourceFetcherUtils.ts +15 -17
- package/src/utils/SpeechToTextModule/ASR.ts +303 -0
- package/src/utils/SpeechToTextModule/OnlineProcessor.ts +87 -0
- package/src/utils/SpeechToTextModule/hypothesisBuffer.ts +79 -0
- package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.cpp +0 -31
- package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.h +0 -21
- package/lib/module/constants/sttDefaults.js +0 -74
- package/lib/module/constants/sttDefaults.js.map +0 -1
- package/lib/module/controllers/SpeechToTextController.js +0 -320
- package/lib/module/controllers/SpeechToTextController.js.map +0 -1
- package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
- package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -57
- package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
- package/src/constants/sttDefaults.ts +0 -82
- package/src/controllers/SpeechToTextController.ts +0 -471
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -7
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/xcuserdata/norbertklockiewicz.xcuserdatad/UserInterfaceState.xcuserstate +0 -0
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/xcuserdata/norbertklockiewicz.xcuserdatad/xcschemes/xcschememanagement.plist +0 -14
|
@@ -0,0 +1,191 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
|
|
3
|
+
// NOTE: This will be implemented in C++
|
|
4
|
+
|
|
5
|
+
import { TokenizerModule } from '../../modules/natural_language_processing/TokenizerModule';
|
|
6
|
+
import { ResourceFetcher } from '../ResourceFetcher';
|
|
7
|
+
export class ASR {
|
|
8
|
+
tokenizerModule = new TokenizerModule();
|
|
9
|
+
timePrecision = 0.02; // Whisper timestamp precision
|
|
10
|
+
maxDecodeLength = 128;
|
|
11
|
+
chunkSize = 30; // 30 seconds
|
|
12
|
+
minChunkSamples = 1 * 16000; // 1 second
|
|
13
|
+
samplingRate = 16000;
|
|
14
|
+
async load(model, onDownloadProgressCallback) {
|
|
15
|
+
const tokenizerLoadPromise = this.tokenizerModule.load(model);
|
|
16
|
+
const encoderDecoderPromise = ResourceFetcher.fetch(onDownloadProgressCallback, model.encoderSource, model.decoderSource);
|
|
17
|
+
const [_, encoderDecoderResults] = await Promise.all([tokenizerLoadPromise, encoderDecoderPromise]);
|
|
18
|
+
const encoderSource = encoderDecoderResults?.[0];
|
|
19
|
+
const decoderSource = encoderDecoderResults?.[1];
|
|
20
|
+
if (!encoderSource || !decoderSource) {
|
|
21
|
+
throw new Error('Download interrupted.');
|
|
22
|
+
}
|
|
23
|
+
this.nativeModule = await global.loadSpeechToText(encoderSource, decoderSource, 'whisper');
|
|
24
|
+
this.startOfTranscriptToken = await this.tokenizerModule.tokenToId('<|startoftranscript|>');
|
|
25
|
+
this.endOfTextToken = await this.tokenizerModule.tokenToId('<|endoftext|>');
|
|
26
|
+
this.timestampBeginToken = await this.tokenizerModule.tokenToId('<|0.00|>');
|
|
27
|
+
}
|
|
28
|
+
async getInitialSequence(options) {
|
|
29
|
+
const initialSequence = [this.startOfTranscriptToken];
|
|
30
|
+
if (options.language) {
|
|
31
|
+
const languageToken = await this.tokenizerModule.tokenToId(`<|${options.language}|>`);
|
|
32
|
+
const taskToken = await this.tokenizerModule.tokenToId('<|transcribe|>');
|
|
33
|
+
initialSequence.push(languageToken);
|
|
34
|
+
initialSequence.push(taskToken);
|
|
35
|
+
}
|
|
36
|
+
initialSequence.push(this.timestampBeginToken);
|
|
37
|
+
return initialSequence;
|
|
38
|
+
}
|
|
39
|
+
async generate(audio, temperature, options) {
|
|
40
|
+
await this.encode(new Float32Array(audio));
|
|
41
|
+
const initialSequence = await this.getInitialSequence(options);
|
|
42
|
+
const sequencesIds = [...initialSequence];
|
|
43
|
+
const scores = [];
|
|
44
|
+
while (sequencesIds.length <= this.maxDecodeLength) {
|
|
45
|
+
const logits = this.softmaxWithTemperature(Array.from(await this.decode(sequencesIds)), temperature === 0 ? 1 : temperature);
|
|
46
|
+
const nextTokenId = temperature === 0 ? logits.indexOf(Math.max(...logits)) : this.sampleFromDistribution(logits);
|
|
47
|
+
const nextTokenProb = logits[nextTokenId];
|
|
48
|
+
sequencesIds.push(nextTokenId);
|
|
49
|
+
scores.push(nextTokenProb);
|
|
50
|
+
if (nextTokenId === this.endOfTextToken) {
|
|
51
|
+
break;
|
|
52
|
+
}
|
|
53
|
+
}
|
|
54
|
+
return {
|
|
55
|
+
sequencesIds: sequencesIds.slice(initialSequence.length),
|
|
56
|
+
scores: scores.slice(initialSequence.length)
|
|
57
|
+
};
|
|
58
|
+
}
|
|
59
|
+
softmaxWithTemperature(logits, temperature = 1.0) {
|
|
60
|
+
const max = Math.max(...logits);
|
|
61
|
+
const exps = logits.map(logit => Math.exp((logit - max) / temperature));
|
|
62
|
+
const sum = exps.reduce((a, b) => a + b, 0);
|
|
63
|
+
return exps.map(exp => exp / sum);
|
|
64
|
+
}
|
|
65
|
+
sampleFromDistribution(probs) {
|
|
66
|
+
const r = Math.random();
|
|
67
|
+
let cumulative = 0;
|
|
68
|
+
for (let i = 0; i < probs.length; i++) {
|
|
69
|
+
cumulative += probs[i];
|
|
70
|
+
if (r < cumulative) {
|
|
71
|
+
return i;
|
|
72
|
+
}
|
|
73
|
+
}
|
|
74
|
+
return probs.length - 1;
|
|
75
|
+
}
|
|
76
|
+
async generateWithFallback(audio, options) {
|
|
77
|
+
const temperatures = [0.0, 0.2, 0.4, 0.6, 0.8, 1.0];
|
|
78
|
+
let generatedTokens = [];
|
|
79
|
+
for (const temperature of temperatures) {
|
|
80
|
+
const result = await this.generate(audio, temperature, options);
|
|
81
|
+
const tokens = result.sequencesIds;
|
|
82
|
+
const scores = result.scores;
|
|
83
|
+
const seqLen = tokens.length;
|
|
84
|
+
const cumLogProb = scores.reduce((acc, score) => acc + Math.log(score), 0);
|
|
85
|
+
const avgLogProb = cumLogProb / seqLen;
|
|
86
|
+
if (avgLogProb >= -1.0) {
|
|
87
|
+
generatedTokens = tokens;
|
|
88
|
+
break;
|
|
89
|
+
}
|
|
90
|
+
}
|
|
91
|
+
return this.calculateWordLevelTimestamps(generatedTokens, audio);
|
|
92
|
+
}
|
|
93
|
+
async calculateWordLevelTimestamps(generatedTokens, audio) {
|
|
94
|
+
const segments = [];
|
|
95
|
+
let tokens = [];
|
|
96
|
+
let prevTimestamp = this.timestampBeginToken;
|
|
97
|
+
for (let i = 0; i < generatedTokens.length; i++) {
|
|
98
|
+
if (generatedTokens[i] < this.timestampBeginToken) {
|
|
99
|
+
tokens.push(generatedTokens[i]);
|
|
100
|
+
}
|
|
101
|
+
if (i > 0 && generatedTokens[i - 1] >= this.timestampBeginToken && generatedTokens[i] >= this.timestampBeginToken) {
|
|
102
|
+
const start = prevTimestamp;
|
|
103
|
+
const end = generatedTokens[i - 1];
|
|
104
|
+
const wordObjects = await this.estimateWordTimestampsLinear(tokens, start, end);
|
|
105
|
+
segments.push({
|
|
106
|
+
words: wordObjects
|
|
107
|
+
});
|
|
108
|
+
tokens = [];
|
|
109
|
+
prevTimestamp = generatedTokens[i];
|
|
110
|
+
}
|
|
111
|
+
}
|
|
112
|
+
const start = prevTimestamp;
|
|
113
|
+
const end = generatedTokens.at(-2);
|
|
114
|
+
const wordObjects = await this.estimateWordTimestampsLinear(tokens, start, end);
|
|
115
|
+
segments.push({
|
|
116
|
+
words: wordObjects
|
|
117
|
+
});
|
|
118
|
+
const scalingFactor = audio.length / this.samplingRate / ((end - this.timestampBeginToken) * this.timePrecision);
|
|
119
|
+
if (scalingFactor < 1) {
|
|
120
|
+
for (const segment of segments) {
|
|
121
|
+
for (const word of segment.words) {
|
|
122
|
+
word.start *= scalingFactor;
|
|
123
|
+
word.end *= scalingFactor;
|
|
124
|
+
}
|
|
125
|
+
}
|
|
126
|
+
}
|
|
127
|
+
return segments;
|
|
128
|
+
}
|
|
129
|
+
async estimateWordTimestampsLinear(tokens, start, end) {
|
|
130
|
+
const duration = (end - start) * this.timePrecision;
|
|
131
|
+
const segmentText = (await this.tokenizerModule.decode(tokens)).trim();
|
|
132
|
+
const words = segmentText.split(' ').map(w => ` ${w}`);
|
|
133
|
+
const numOfCharacters = words.reduce((acc, word) => acc + word.length, 0);
|
|
134
|
+
const timePerCharacter = duration / numOfCharacters;
|
|
135
|
+
const wordObjects = [];
|
|
136
|
+
const startTimeOffset = (start - this.timestampBeginToken) * this.timePrecision;
|
|
137
|
+
let prevCharNum = 0;
|
|
138
|
+
for (let j = 0; j < words.length; j++) {
|
|
139
|
+
const word = words[j];
|
|
140
|
+
const start = startTimeOffset + prevCharNum * timePerCharacter;
|
|
141
|
+
const end = start + timePerCharacter * word.length;
|
|
142
|
+
wordObjects.push({
|
|
143
|
+
word,
|
|
144
|
+
start,
|
|
145
|
+
end
|
|
146
|
+
});
|
|
147
|
+
prevCharNum += word.length;
|
|
148
|
+
}
|
|
149
|
+
return wordObjects;
|
|
150
|
+
}
|
|
151
|
+
async transcribe(audio, options) {
|
|
152
|
+
let seek = 0;
|
|
153
|
+
const allSegments = [];
|
|
154
|
+
while (seek * this.samplingRate < audio.length) {
|
|
155
|
+
const chunk = audio.slice(seek * this.samplingRate, (seek + this.chunkSize) * this.samplingRate);
|
|
156
|
+
if (chunk.length < this.minChunkSamples) {
|
|
157
|
+
return allSegments;
|
|
158
|
+
}
|
|
159
|
+
const segments = await this.generateWithFallback(chunk, options);
|
|
160
|
+
for (const segment of segments) {
|
|
161
|
+
for (const word of segment.words) {
|
|
162
|
+
word.start += seek;
|
|
163
|
+
word.end += seek;
|
|
164
|
+
}
|
|
165
|
+
}
|
|
166
|
+
allSegments.push(...segments);
|
|
167
|
+
const lastTimeStamp = segments.at(-1).words.at(-1).end;
|
|
168
|
+
seek = lastTimeStamp;
|
|
169
|
+
}
|
|
170
|
+
return allSegments;
|
|
171
|
+
}
|
|
172
|
+
tsWords(segments) {
|
|
173
|
+
const o = [];
|
|
174
|
+
for (const segment of segments) {
|
|
175
|
+
for (const word of segment.words) {
|
|
176
|
+
o.push([word.start, word.end, word.word]);
|
|
177
|
+
}
|
|
178
|
+
}
|
|
179
|
+
return o;
|
|
180
|
+
}
|
|
181
|
+
segmentsEndTs(res) {
|
|
182
|
+
return res.map(segment => segment.words.at(-1).end);
|
|
183
|
+
}
|
|
184
|
+
async encode(waveform) {
|
|
185
|
+
await this.nativeModule.encode(waveform);
|
|
186
|
+
}
|
|
187
|
+
async decode(tokens) {
|
|
188
|
+
return new Float32Array(await this.nativeModule.decode(tokens));
|
|
189
|
+
}
|
|
190
|
+
}
|
|
191
|
+
//# sourceMappingURL=ASR.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"names":["TokenizerModule","ResourceFetcher","ASR","tokenizerModule","timePrecision","maxDecodeLength","chunkSize","minChunkSamples","samplingRate","load","model","onDownloadProgressCallback","tokenizerLoadPromise","encoderDecoderPromise","fetch","encoderSource","decoderSource","_","encoderDecoderResults","Promise","all","Error","nativeModule","global","loadSpeechToText","startOfTranscriptToken","tokenToId","endOfTextToken","timestampBeginToken","getInitialSequence","options","initialSequence","language","languageToken","taskToken","push","generate","audio","temperature","encode","Float32Array","sequencesIds","scores","length","logits","softmaxWithTemperature","Array","from","decode","nextTokenId","indexOf","Math","max","sampleFromDistribution","nextTokenProb","slice","exps","map","logit","exp","sum","reduce","a","b","probs","r","random","cumulative","i","generateWithFallback","temperatures","generatedTokens","result","tokens","seqLen","cumLogProb","acc","score","log","avgLogProb","calculateWordLevelTimestamps","segments","prevTimestamp","start","end","wordObjects","estimateWordTimestampsLinear","words","at","scalingFactor","segment","word","duration","segmentText","trim","split","w","numOfCharacters","timePerCharacter","startTimeOffset","prevCharNum","j","transcribe","seek","allSegments","chunk","lastTimeStamp","tsWords","o","segmentsEndTs","res","waveform"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/ASR.ts"],"mappings":";;AAAA;;AAEA,SAASA,eAAe,QAAQ,2DAA2D;AAQ3F,SAASC,eAAe,QAAQ,oBAAoB;AAEpD,OAAO,MAAMC,GAAG,CAAC;EAEPC,eAAe,GAAoB,IAAIH,eAAe,CAAC,CAAC;EAExDI,aAAa,GAAW,IAAI,CAAC,CAAC;EAC9BC,eAAe,GAAW,GAAG;EAC7BC,SAAS,GAAW,EAAE,CAAC,CAAC;EACxBC,eAAe,GAAW,CAAC,GAAG,KAAK,CAAC,CAAC;EACrCC,YAAY,GAAW,KAAK;EAMpC,MAAaC,IAAIA,CACfC,KAA8B,EAC9BC,0BAAsD,EACtD;IACA,MAAMC,oBAAoB,GAAG,IAAI,CAACT,eAAe,CAACM,IAAI,CAACC,KAAK,CAAC;IAC7D,MAAMG,qBAAqB,GAAGZ,eAAe,CAACa,KAAK,CACjDH,0BAA0B,EAC1BD,KAAK,CAACK,aAAa,EACnBL,KAAK,CAACM,aACR,CAAC;IACD,MAAM,CAAC
C,CAAC,EAAEC,qBAAqB,CAAC,GAAG,MAAMC,OAAO,CAACC,GAAG,CAAC,CACnDR,oBAAoB,EACpBC,qBAAqB,CACtB,CAAC;IACF,MAAME,aAAa,GAAGG,qBAAqB,GAAG,CAAC,CAAC;IAChD,MAAMF,aAAa,GAAGE,qBAAqB,GAAG,CAAC,CAAC;IAChD,IAAI,CAACH,aAAa,IAAI,CAACC,aAAa,EAAE;MACpC,MAAM,IAAIK,KAAK,CAAC,uBAAuB,CAAC;IAC1C;IACA,IAAI,CAACC,YAAY,GAAG,MAAMC,MAAM,CAACC,gBAAgB,CAC/CT,aAAa,EACbC,aAAa,EACb,SACF,CAAC;IAED,IAAI,CAACS,sBAAsB,GAAG,MAAM,IAAI,CAACtB,eAAe,CAACuB,SAAS,CAChE,uBACF,CAAC;IACD,IAAI,CAACC,cAAc,GAAG,MAAM,IAAI,CAACxB,eAAe,CAACuB,SAAS,CAAC,eAAe,CAAC;IAC3E,IAAI,CAACE,mBAAmB,GAAG,MAAM,IAAI,CAACzB,eAAe,CAACuB,SAAS,CAAC,UAAU,CAAC;EAC7E;EAEA,MAAcG,kBAAkBA,CAC9BC,OAAwB,EACL;IACnB,MAAMC,eAAyB,GAAG,CAAC,IAAI,CAACN,sBAAsB,CAAC;IAC/D,IAAIK,OAAO,CAACE,QAAQ,EAAE;MACpB,MAAMC,aAAa,GAAG,MAAM,IAAI,CAAC9B,eAAe,CAACuB,SAAS,CACxD,KAAKI,OAAO,CAACE,QAAQ,IACvB,CAAC;MACD,MAAME,SAAS,GAAG,MAAM,IAAI,CAAC/B,eAAe,CAACuB,SAAS,CAAC,gBAAgB,CAAC;MACxEK,eAAe,CAACI,IAAI,CAACF,aAAa,CAAC;MACnCF,eAAe,CAACI,IAAI,CAACD,SAAS,CAAC;IACjC;IACAH,eAAe,CAACI,IAAI,CAAC,IAAI,CAACP,mBAAmB,CAAC;IAC9C,OAAOG,eAAe;EACxB;EAEA,MAAcK,QAAQA,CACpBC,KAAe,EACfC,WAAmB,EACnBR,OAAwB,EAIvB;IACD,MAAM,IAAI,CAACS,MAAM,CAAC,IAAIC,YAAY,CAACH,KAAK,CAAC,CAAC;IAC1C,MAAMN,eAAe,GAAG,MAAM,IAAI,CAACF,kBAAkB,CAACC,OAAO,CAAC;IAC9D,MAAMW,YAAY,GAAG,CAAC,GAAGV,eAAe,CAAC;IACzC,MAAMW,MAAgB,GAAG,EAAE;IAE3B,OAAOD,YAAY,CAACE,MAAM,IAAI,IAAI,CAACtC,eAAe,EAAE;MAClD,MAAMuC,MAAM,GAAG,IAAI,CAACC,sBAAsB,CACxCC,KAAK,CAACC,IAAI,CAAC,MAAM,IAAI,CAACC,MAAM,CAACP,YAAY,CAAC,CAAC,EAC3CH,WAAW,KAAK,CAAC,GAAG,CAAC,GAAGA,WAC1B,CAAC;MACD,MAAMW,WAAW,GACfX,WAAW,KAAK,CAAC,GACbM,MAAM,CAACM,OAAO,CAACC,IAAI,CAACC,GAAG,CAAC,GAAGR,MAAM,CAAC,CAAC,GACnC,IAAI,CAACS,sBAAsB,CAACT,MAAM,CAAC;MACzC,MAAMU,aAAa,GAAGV,MAAM,CAACK,WAAW,CAAE;MAC1CR,YAAY,CAACN,IAAI,CAACc,WAAW,CAAC;MAC9BP,MAAM,CAACP,IAAI,CAACmB,aAAa,CAAC;MAC1B,IAAIL,WAAW,KAAK,IAAI,CAACtB,cAAc,EAAE;QACvC;MACF;IACF;IAEA,OAAO;MACLc,YAAY,EAAEA,YAAY,CAACc,KAAK,CAACxB,eAAe,CAACY,MAAM,CAAC;MACxDD,MAAM,EAAEA,MAAM,CAACa,KAAK,CAACxB,eAAe,CAACY,MAAM;IAC7C,CAAC;EACH;EAEQE,sBAAsB
A,CAACD,MAAgB,EAAEN,WAAW,GAAG,GAAG,EAAE;IAClE,MAAMc,GAAG,GAAGD,IAAI,CAACC,GAAG,CAAC,GAAGR,MAAM,CAAC;IAC/B,MAAMY,IAAI,GAAGZ,MAAM,CAACa,GAAG,CAAEC,KAAK,IAAKP,IAAI,CAACQ,GAAG,CAAC,CAACD,KAAK,GAAGN,GAAG,IAAId,WAAW,CAAC,CAAC;IACzE,MAAMsB,GAAG,GAAGJ,IAAI,CAACK,MAAM,CAAC,CAACC,CAAC,EAAEC,CAAC,KAAKD,CAAC,GAAGC,CAAC,EAAE,CAAC,CAAC;IAC3C,OAAOP,IAAI,CAACC,GAAG,CAAEE,GAAG,IAAKA,GAAG,GAAGC,GAAG,CAAC;EACrC;EAEQP,sBAAsBA,CAACW,KAAe,EAAU;IACtD,MAAMC,CAAC,GAAGd,IAAI,CAACe,MAAM,CAAC,CAAC;IACvB,IAAIC,UAAU,GAAG,CAAC;IAClB,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGJ,KAAK,CAACrB,MAAM,EAAEyB,CAAC,EAAE,EAAE;MACrCD,UAAU,IAAIH,KAAK,CAACI,CAAC,CAAE;MACvB,IAAIH,CAAC,GAAGE,UAAU,EAAE;QAClB,OAAOC,CAAC;MACV;IACF;IACA,OAAOJ,KAAK,CAACrB,MAAM,GAAG,CAAC;EACzB;EAEA,MAAc0B,oBAAoBA,CAChChC,KAAe,EACfP,OAAwB,EACxB;IACA,MAAMwC,YAAY,GAAG,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC;IACnD,IAAIC,eAAyB,GAAG,EAAE;IAElC,KAAK,MAAMjC,WAAW,IAAIgC,YAAY,EAAE;MACtC,MAAME,MAAM,GAAG,MAAM,IAAI,CAACpC,QAAQ,CAACC,KAAK,EAAEC,WAAW,EAAER,OAAO,CAAC;MAC/D,MAAM2C,MAAM,GAAGD,MAAM,CAAC/B,YAAY;MAClC,MAAMC,MAAM,GAAG8B,MAAM,CAAC9B,MAAM;MAE5B,MAAMgC,MAAM,GAAGD,MAAM,CAAC9B,MAAM;MAC5B,MAAMgC,UAAU,GAAGjC,MAAM,CAACmB,MAAM,CAC9B,CAACe,GAAG,EAAEC,KAAK,KAAKD,GAAG,GAAGzB,IAAI,CAAC2B,GAAG,CAACD,KAAK,CAAC,EACrC,CACF,CAAC;MACD,MAAME,UAAU,GAAGJ,UAAU,GAAGD,MAAM;MAEtC,IAAIK,UAAU,IAAI,CAAC,GAAG,EAAE;QACtBR,eAAe,GAAGE,MAAM;QACxB;MACF;IACF;IAEA,OAAO,IAAI,CAACO,4BAA4B,CAACT,eAAe,EAAElC,KAAK,CAAC;EAClE;EAEA,MAAc2C,4BAA4BA,CACxCT,eAAyB,EACzBlC,KAAe,EACK;IACpB,MAAM4C,QAAmB,GAAG,EAAE;IAE9B,IAAIR,MAAgB,GAAG,EAAE;IACzB,IAAIS,aAAa,GAAG,IAAI,CAACtD,mBAAmB;IAC5C,KAAK,IAAIwC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGG,eAAe,CAAC5B,MAAM,EAAEyB,CAAC,EAAE,EAAE;MAC/C,IAAIG,eAAe,CAACH,CAAC,CAAC,GAAI,IAAI,CAACxC,mBAAmB,EAAE;QAClD6C,MAAM,CAACtC,IAAI,CAACoC,eAAe,CAACH,CAAC,CAAE,CAAC;MAClC;MAEA,IACEA,CAAC,GAAG,CAAC,IACLG,eAAe,CAACH,CAAC,GAAG,CAAC,CAAC,IAAK,IAAI,CAACxC,mBAAmB,IACnD2C,eAAe,CAACH,CAAC,CAAC,IAAK,IAAI,CAACxC,mBAAmB,EAC/C;QACA,MAAMuD,KAAK,GAAGD,aAAa;QAC3B
,MAAME,GAAG,GAAGb,eAAe,CAACH,CAAC,GAAG,CAAC,CAAE;QACnC,MAAMiB,WAAW,GAAG,MAAM,IAAI,CAACC,4BAA4B,CACzDb,MAAM,EACNU,KAAK,EACLC,GACF,CAAC;QACDH,QAAQ,CAAC9C,IAAI,CAAC;UACZoD,KAAK,EAAEF;QACT,CAAC,CAAC;QACFZ,MAAM,GAAG,EAAE;QACXS,aAAa,GAAGX,eAAe,CAACH,CAAC,CAAE;MACrC;IACF;IAEA,MAAMe,KAAK,GAAGD,aAAa;IAC3B,MAAME,GAAG,GAAGb,eAAe,CAACiB,EAAE,CAAC,CAAC,CAAC,CAAE;IACnC,MAAMH,WAAW,GAAG,MAAM,IAAI,CAACC,4BAA4B,CACzDb,MAAM,EACNU,KAAK,EACLC,GACF,CAAC;IACDH,QAAQ,CAAC9C,IAAI,CAAC;MACZoD,KAAK,EAAEF;IACT,CAAC,CAAC;IAEF,MAAMI,aAAa,GACjBpD,KAAK,CAACM,MAAM,GACZ,IAAI,CAACnC,YAAY,IAChB,CAAC4E,GAAG,GAAG,IAAI,CAACxD,mBAAmB,IAAI,IAAI,CAACxB,aAAa,CAAC;IACzD,IAAIqF,aAAa,GAAG,CAAC,EAAE;MACrB,KAAK,MAAMC,OAAO,IAAIT,QAAQ,EAAE;QAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;UAChCI,IAAI,CAACR,KAAK,IAAIM,aAAa;UAC3BE,IAAI,CAACP,GAAG,IAAIK,aAAa;QAC3B;MACF;IACF;IAEA,OAAOR,QAAQ;EACjB;EAEA,MAAcK,4BAA4BA,CACxCb,MAAgB,EAChBU,KAAa,EACbC,GAAW,EACY;IACvB,MAAMQ,QAAQ,GAAG,CAACR,GAAG,GAAGD,KAAK,IAAI,IAAI,CAAC/E,aAAa;IACnD,MAAMyF,WAAW,GAAG,CACjB,MAAM,IAAI,CAAC1F,eAAe,CAAC6C,MAAM,CAACyB,MAAM,CAAC,EAC1CqB,IAAI,CAAC,CAAC;IAER,MAAMP,KAAK,GAAGM,WAAW,CAACE,KAAK,CAAC,GAAG,CAAC,CAACtC,GAAG,CAAEuC,CAAC,IAAK,IAAIA,CAAC,EAAE,CAAC;IACxD,MAAMC,eAAe,GAAGV,KAAK,CAAC1B,MAAM,CAClC,CAACe,GAAW,EAAEe,IAAY,KAAKf,GAAG,GAAGe,IAAI,CAAChD,MAAM,EAChD,CACF,CAAC;IAED,MAAMuD,gBAAgB,GAAGN,QAAQ,GAAGK,eAAe;IAEnD,MAAMZ,WAAyB,GAAG,EAAE;IACpC,MAAMc,eAAe,GACnB,CAAChB,KAAK,GAAG,IAAI,CAACvD,mBAAmB,IAAI,IAAI,CAACxB,aAAa;IAEzD,IAAIgG,WAAW,GAAG,CAAC;IACnB,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGd,KAAK,CAAC5C,MAAM,EAAE0D,CAAC,EAAE,EAAE;MACrC,MAAMV,IAAI,GAAGJ,KAAK,CAACc,CAAC,CAAE;MACtB,MAAMlB,KAAK,GAAGgB,eAAe,GAAGC,WAAW,GAAGF,gBAAgB;MAC9D,MAAMd,GAAG,GAAGD,KAAK,GAAGe,gBAAgB,GAAGP,IAAI,CAAChD,MAAM;MAClD0C,WAAW,CAAClD,IAAI,CAAC;QAAEwD,IAAI;QAAER,KAAK;QAAEC;MAAI,CAAC,CAAC;MACtCgB,WAAW,IAAIT,IAAI,CAAChD,MAAM;IAC5B;IAEA,OAAO0C,WAAW;EACpB;EAEA,MAAaiB,UAAUA,CACrBjE,KAAe,EACfP,OAAwB,EACJ;IACpB,IAAIyE,IAAI,GAAG,CAAC;IACZ,MAAMC,WAAsB,GAAG,EAAE;IAEjC,OAAOD,IAAI,GAAG,IAAI
,CAAC/F,YAAY,GAAG6B,KAAK,CAACM,MAAM,EAAE;MAC9C,MAAM8D,KAAK,GAAGpE,KAAK,CAACkB,KAAK,CACvBgD,IAAI,GAAG,IAAI,CAAC/F,YAAY,EACxB,CAAC+F,IAAI,GAAG,IAAI,CAACjG,SAAS,IAAI,IAAI,CAACE,YACjC,CAAC;MACD,IAAIiG,KAAK,CAAC9D,MAAM,GAAG,IAAI,CAACpC,eAAe,EAAE;QACvC,OAAOiG,WAAW;MACpB;MACA,MAAMvB,QAAQ,GAAG,MAAM,IAAI,CAACZ,oBAAoB,CAACoC,KAAK,EAAE3E,OAAO,CAAC;MAChE,KAAK,MAAM4D,OAAO,IAAIT,QAAQ,EAAE;QAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;UAChCI,IAAI,CAACR,KAAK,IAAIoB,IAAI;UAClBZ,IAAI,CAACP,GAAG,IAAImB,IAAI;QAClB;MACF;MACAC,WAAW,CAACrE,IAAI,CAAC,GAAG8C,QAAQ,CAAC;MAC7B,MAAMyB,aAAa,GAAGzB,QAAQ,CAACO,EAAE,CAAC,CAAC,CAAC,CAAC,CAAED,KAAK,CAACC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAEJ,GAAG;MACxDmB,IAAI,GAAGG,aAAa;IACtB;IAEA,OAAOF,WAAW;EACpB;EAEOG,OAAOA,CAAC1B,QAAmB,EAAe;IAC/C,MAAM2B,CAAc,GAAG,EAAE;IACzB,KAAK,MAAMlB,OAAO,IAAIT,QAAQ,EAAE;MAC9B,KAAK,MAAMU,IAAI,IAAID,OAAO,CAACH,KAAK,EAAE;QAChCqB,CAAC,CAACzE,IAAI,CAAC,CAACwD,IAAI,CAACR,KAAK,EAAEQ,IAAI,CAACP,GAAG,EAAEO,IAAI,CAACA,IAAI,CAAC,CAAC;MAC3C;IACF;IACA,OAAOiB,CAAC;EACV;EAEOC,aAAaA,CAACC,GAAc,EAAE;IACnC,OAAOA,GAAG,CAACrD,GAAG,CAAEiC,OAAO,IAAKA,OAAO,CAACH,KAAK,CAACC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAEJ,GAAG,CAAC;EACxD;EAEA,MAAa7C,MAAMA,CAACwE,QAAsB,EAAiB;IACzD,MAAM,IAAI,CAACzF,YAAY,CAACiB,MAAM,CAACwE,QAAQ,CAAC;EAC1C;EAEA,MAAa/D,MAAMA,CAACyB,MAAgB,EAAyB;IAC3D,OAAO,IAAIjC,YAAY,CAAC,MAAM,IAAI,CAAClB,YAAY,CAAC0B,MAAM,CAACyB,MAAM,CAAC,CAAC;EACjE;AACF","ignoreList":[]}
|
|
@@ -0,0 +1,73 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
|
|
3
|
+
// NOTE: This will be implemented in C++
|
|
4
|
+
|
|
5
|
+
import { HypothesisBuffer } from './hypothesisBuffer';
|
|
6
|
+
export class OnlineASRProcessor {
|
|
7
|
+
samplingRate = 16000;
|
|
8
|
+
audioBuffer = [];
|
|
9
|
+
transcriptBuffer = new HypothesisBuffer();
|
|
10
|
+
bufferTimeOffset = 0;
|
|
11
|
+
committed = [];
|
|
12
|
+
constructor(asr) {
|
|
13
|
+
this.asr = asr;
|
|
14
|
+
}
|
|
15
|
+
insertAudioChunk(audio) {
|
|
16
|
+
this.audioBuffer.push(...audio);
|
|
17
|
+
}
|
|
18
|
+
async processIter(options) {
|
|
19
|
+
const res = await this.asr.transcribe(this.audioBuffer, options);
|
|
20
|
+
const tsw = this.asr.tsWords(res);
|
|
21
|
+
this.transcriptBuffer.insert(tsw, this.bufferTimeOffset);
|
|
22
|
+
const o = this.transcriptBuffer.flush();
|
|
23
|
+
this.committed.push(...o);
|
|
24
|
+
const s = 15;
|
|
25
|
+
if (this.audioBuffer.length / this.samplingRate > s) {
|
|
26
|
+
this.chunkCompletedSegment(res);
|
|
27
|
+
}
|
|
28
|
+
const committed = this.toFlush(o)[2];
|
|
29
|
+
const nonCommitted = this.transcriptBuffer.complete().map(x => x[2]).join('');
|
|
30
|
+
return {
|
|
31
|
+
committed,
|
|
32
|
+
nonCommitted
|
|
33
|
+
};
|
|
34
|
+
}
|
|
35
|
+
chunkCompletedSegment(res) {
|
|
36
|
+
if (this.committed.length === 0) {
|
|
37
|
+
return;
|
|
38
|
+
}
|
|
39
|
+
const ends = this.asr.segmentsEndTs(res);
|
|
40
|
+
const t = this.committed.at(-1)[1];
|
|
41
|
+
if (ends.length > 1) {
|
|
42
|
+
let e = ends.at(-2) + this.bufferTimeOffset;
|
|
43
|
+
while (ends.length > 2 && e > t) {
|
|
44
|
+
ends.pop();
|
|
45
|
+
e = ends.at(-2) + this.bufferTimeOffset;
|
|
46
|
+
}
|
|
47
|
+
if (e <= t) {
|
|
48
|
+
this.chunkAt(e);
|
|
49
|
+
}
|
|
50
|
+
}
|
|
51
|
+
}
|
|
52
|
+
chunkAt(time) {
|
|
53
|
+
this.transcriptBuffer.popCommitted(time);
|
|
54
|
+
const cutSeconds = time - this.bufferTimeOffset;
|
|
55
|
+
this.audioBuffer = this.audioBuffer.slice(Math.floor(cutSeconds * this.samplingRate));
|
|
56
|
+
this.bufferTimeOffset = time;
|
|
57
|
+
}
|
|
58
|
+
async finish() {
|
|
59
|
+
const o = this.transcriptBuffer.complete();
|
|
60
|
+
const f = this.toFlush(o);
|
|
61
|
+
this.bufferTimeOffset += this.audioBuffer.length / this.samplingRate;
|
|
62
|
+
return {
|
|
63
|
+
committed: f[2]
|
|
64
|
+
};
|
|
65
|
+
}
|
|
66
|
+
toFlush(words) {
|
|
67
|
+
const t = words.map(s => s[2]).join(' ');
|
|
68
|
+
const b = words.length === 0 ? null : words[0][0];
|
|
69
|
+
const e = words.length === 0 ? null : words.at(-1)[1];
|
|
70
|
+
return [b, e, t];
|
|
71
|
+
}
|
|
72
|
+
}
|
|
73
|
+
//# sourceMappingURL=OnlineProcessor.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"names":["HypothesisBuffer","OnlineASRProcessor","samplingRate","audioBuffer","transcriptBuffer","bufferTimeOffset","committed","constructor","asr","insertAudioChunk","audio","push","processIter","options","res","transcribe","tsw","tsWords","insert","o","flush","s","length","chunkCompletedSegment","toFlush","nonCommitted","complete","map","x","join","ends","segmentsEndTs","t","at","e","pop","chunkAt","time","popCommitted","cutSeconds","slice","Math","floor","finish","f","words","b"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/OnlineProcessor.ts"],"mappings":";;AAAA;;AAIA,SAASA,gBAAgB,QAAQ,oBAAoB;AAErD,OAAO,MAAMC,kBAAkB,CAAC;EAGtBC,YAAY,GAAW,KAAK;EAC7BC,WAAW,GAAa,EAAE;EACzBC,gBAAgB,GAAqB,IAAIJ,gBAAgB,CAAC,CAAC;EAC3DK,gBAAgB,GAAW,CAAC;EAC5BC,SAAS,GAAgB,EAAE;EAEnCC,WAAWA,CAACC,GAAQ,EAAE;IACpB,IAAI,CAACA,GAAG,GAAGA,GAAG;EAChB;EAEOC,gBAAgBA,CAACC,KAAe,EAAE;IACvC,IAAI,CAACP,WAAW,CAACQ,IAAI,CAAC,GAAGD,KAAK,CAAC;EACjC;EAEA,MAAaE,WAAWA,CAACC,OAAwB,EAAE;IACjD,MAAMC,GAAG,GAAG,MAAM,IAAI,CAACN,GAAG,CAACO,UAAU,CAAC,IAAI,CAACZ,WAAW,EAAEU,OAAO,CAAC;IAChE,MAAMG,GAAG,GAAG,IAAI,CAACR,GAAG,CAACS,OAAO,CAACH,GAAG,CAAC;IACjC,IAAI,CAACV,gBAAgB,CAACc,MAAM,CAACF,GAAG,EAAE,IAAI,CAACX,gBAAgB,CAAC;IACxD,MAAMc,CAAC,GAAG,IAAI,CAACf,gBAAgB,CAACgB,KAAK,CAAC,CAAC;IACvC,IAAI,CAACd,SAAS,CAACK,IAAI,CAAC,GAAGQ,CAAC,CAAC;IAEzB,MAAME,CAAC,GAAG,EAAE;IACZ,IAAI,IAAI,CAAClB,WAAW,CAACmB,MAAM,GAAG,IAAI,CAACpB,YAAY,GAAGmB,CAAC,EAAE;MACnD,IAAI,CAACE,qBAAqB,CAACT,GAAG,CAAC;IACjC;IAEA,MAAMR,SAAS,GAAG,IAAI,CAACkB,OAAO,CAACL,CAAC,CAAC,CAAC,CAAC,CAAC;IACpC,MAAMM,YAAY,GAAG,IAAI,CAACrB,gBAAgB,CACvCsB,QAAQ,CAAC,CAAC,CACVC,GAAG,CAAEC,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,EAAE,CAAC;IACX,OAAO;MAAEvB,SAAS;MAAEmB;IAAa,CAAC;EACpC;EAEQF,qBAAqBA,CAACT,GAAc,EAAE;IAC5C,IAAI,IAAI,CAACR,SAAS,CAACgB,MAAM,KAAK,CAAC,EAAE;MAC/B;IACF;IAEA,MAAMQ,IAAI,GAAG,IAAI,CAACtB,GAAG,CAACuB,aAAa,CAACjB,GAAG,CAAC;IACxC,MAAMkB,CAAC,GAAG,IAAI,CAAC1B,SAAS,CAAC2B,EAAE,CAAC,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;I
AEnC,IAAIH,IAAI,CAACR,MAAM,GAAG,CAAC,EAAE;MACnB,IAAIY,CAAC,GAAGJ,IAAI,CAACG,EAAE,CAAC,CAAC,CAAC,CAAC,GAAI,IAAI,CAAC5B,gBAAgB;MAC5C,OAAOyB,IAAI,CAACR,MAAM,GAAG,CAAC,IAAIY,CAAC,GAAGF,CAAC,EAAE;QAC/BF,IAAI,CAACK,GAAG,CAAC,CAAC;QACVD,CAAC,GAAGJ,IAAI,CAACG,EAAE,CAAC,CAAC,CAAC,CAAC,GAAI,IAAI,CAAC5B,gBAAgB;MAC1C;MAEA,IAAI6B,CAAC,IAAIF,CAAC,EAAE;QACV,IAAI,CAACI,OAAO,CAACF,CAAC,CAAC;MACjB;IACF;EACF;EAEQE,OAAOA,CAACC,IAAY,EAAE;IAC5B,IAAI,CAACjC,gBAAgB,CAACkC,YAAY,CAACD,IAAI,CAAC;IACxC,MAAME,UAAU,GAAGF,IAAI,GAAG,IAAI,CAAChC,gBAAgB;IAC/C,IAAI,CAACF,WAAW,GAAG,IAAI,CAACA,WAAW,CAACqC,KAAK,CACvCC,IAAI,CAACC,KAAK,CAACH,UAAU,GAAG,IAAI,CAACrC,YAAY,CAC3C,CAAC;IACD,IAAI,CAACG,gBAAgB,GAAGgC,IAAI;EAC9B;EAEA,MAAaM,MAAMA,CAAA,EAAG;IACpB,MAAMxB,CAAC,GAAG,IAAI,CAACf,gBAAgB,CAACsB,QAAQ,CAAC,CAAC;IAC1C,MAAMkB,CAAC,GAAG,IAAI,CAACpB,OAAO,CAACL,CAAC,CAAC;IACzB,IAAI,CAACd,gBAAgB,IAAI,IAAI,CAACF,WAAW,CAACmB,MAAM,GAAG,IAAI,CAACpB,YAAY;IACpE,OAAO;MAAEI,SAAS,EAAEsC,CAAC,CAAC,CAAC;IAAE,CAAC;EAC5B;EAEQpB,OAAOA,CAACqB,KAAkB,EAA0C;IAC1E,MAAMb,CAAC,GAAGa,KAAK,CAAClB,GAAG,CAAEN,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAACQ,IAAI,CAAC,GAAG,CAAC;IAC1C,MAAMiB,CAAC,GAAGD,KAAK,CAACvB,MAAM,KAAK,CAAC,GAAG,IAAI,GAAGuB,KAAK,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;IAClD,MAAMX,CAAC,GAAGW,KAAK,CAACvB,MAAM,KAAK,CAAC,GAAG,IAAI,GAAGuB,KAAK,CAACZ,EAAE,CAAC,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;IACtD,OAAO,CAACa,CAAC,EAAEZ,CAAC,EAAEF,CAAC,CAAC;EAClB;AACF","ignoreList":[]}
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
|
|
3
|
+
// NOTE: This will be implemented in C++
|
|
4
|
+
|
|
5
|
+
/**
 * Reconciles successive transcription hypotheses into committed words.
 *
 * Every word is a three-element array `[a, b, text]`; `a` and `b` are
 * timestamps (presumably start and end of the word - confirm with the caller)
 * and `text` is the word itself. A word gets committed when its text appears
 * at the same leading position in two consecutive hypotheses.
 */
export class HypothesisBuffer {
  /** Committed words that `popCommitted` has not dropped yet. */
  committedInBuffer = [];
  /** Uncommitted remainder of the previously flushed hypothesis. */
  buffer = [];
  /** Words from the latest `insert`, waiting for the next `flush`. */
  new = [];
  /** Second timestamp of the most recently committed word. */
  lastCommittedTime = 0;
  /** Text of the most recently committed word, `null` before any commit. */
  lastCommittedWord = null;

  /**
   * Stores a new hypothesis, shifted by `offset`, as the pending word list.
   *
   * Words whose first timestamp is not later than `lastCommittedTime - 0.5`
   * are discarded. If the hypothesis then starts within one time unit of the
   * last commit, the longest-checked (up to 5 words) leading run that repeats
   * the tail of the committed words is removed so it is not committed twice.
   *
   * @param newWords Words of the new hypothesis.
   * @param offset Value added to both timestamps of every word.
   */
  insert(newWords, offset) {
    const shifted = newWords.map(([a, b, text]) => [a + offset, b + offset, text]);
    this.new = shifted.filter(([a]) => a > this.lastCommittedTime - 0.5);

    if (this.new.length === 0) {
      return;
    }
    const [firstTime] = this.new[0];
    const closeToLastCommit = Math.abs(firstTime - this.lastCommittedTime) < 1;
    if (!closeToLastCommit || this.committedInBuffer.length === 0) {
      return;
    }

    const textOf = (word) => word[2];
    // Sizes are taken once, before any word is removed from `this.new`.
    const maxOverlap = Math.min(this.committedInBuffer.length, this.new.length, 5);
    for (let size = 1; size <= maxOverlap; size++) {
      const committedTail = this.committedInBuffer.slice(-size).map(textOf).join(' ');
      const incomingHead = this.new.slice(0, size).map(textOf).join(' ');
      if (committedTail === incomingHead) {
        // The head repeats already committed text: drop it and stop searching.
        this.new.splice(0, size);
        break;
      }
    }
  }

  /**
   * Commits the leading words on which the pending hypothesis and the
   * previous one agree, then makes the rest of the pending hypothesis the new
   * comparison buffer.
   *
   * @returns The words committed by this call (possibly empty).
   */
  flush() {
    const comparable = Math.min(this.new.length, this.buffer.length);
    let agreed = 0;
    while (agreed < comparable && this.new[agreed][2] === this.buffer[agreed][2]) {
      agreed++;
    }

    // Remove the agreed prefix from both lists; the old buffer array is
    // trimmed in place before being replaced.
    const commit = this.new.splice(0, agreed);
    this.buffer.splice(0, agreed);
    if (agreed > 0) {
      const lastWord = commit[agreed - 1];
      this.lastCommittedWord = lastWord[2];
      this.lastCommittedTime = lastWord[1];
    }

    this.buffer = this.new;
    this.new = [];
    this.committedInBuffer.push(...commit);
    return commit;
  }

  /**
   * Forgets committed words whose second timestamp is not later than `time`.
   *
   * @param time Threshold timestamp.
   */
  popCommitted(time) {
    this.committedInBuffer = this.committedInBuffer.filter(([, b]) => b > time);
  }

  /**
   * @returns The words still waiting for confirmation (the current buffer).
   */
  complete() {
    return this.buffer;
  }
}
|
|
56
|
+
//# sourceMappingURL=hypothesisBuffer.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"names":["HypothesisBuffer","committedInBuffer","buffer","new","lastCommittedTime","lastCommittedWord","insert","newWords","offset","newWordsOffset","map","a","b","t","filter","_b","_t","length","Math","abs","cn","nn","i","min","c","slice","w","join","tail","j","shift","flush","commit","push","popCommitted","time","_a","complete"],"sourceRoot":"../../../../src","sources":["utils/SpeechToTextModule/hypothesisBuffer.ts"],"mappings":";;AAAA;;AAIA,OAAO,MAAMA,gBAAgB,CAAC;EACpBC,iBAAiB,GAAgB,EAAE;EACnCC,MAAM,GAAgB,EAAE;EACxBC,GAAG,GAAgB,EAAE;EAErBC,iBAAiB,GAAW,CAAC;EAC9BC,iBAAiB,GAAkB,IAAI;EAEvCC,MAAMA,CAACC,QAAqB,EAAEC,MAAc,EAAE;IACnD,MAAMC,cAA2B,GAAGF,QAAQ,CAACG,GAAG,CAAC,CAAC,CAACC,CAAC,EAAEC,CAAC,EAAEC,CAAC,CAAC,KAAK,CAC9DF,CAAC,GAAGH,MAAM,EACVI,CAAC,GAAGJ,MAAM,EACVK,CAAC,CACF,CAAC;IACF,IAAI,CAACV,GAAG,GAAGM,cAAc,CAACK,MAAM,CAC9B,CAAC,CAACH,CAAC,EAAEI,EAAE,EAAEC,EAAE,CAAC,KAAKL,CAAC,GAAG,IAAI,CAACP,iBAAiB,GAAG,GAChD,CAAC;IAED,IAAI,IAAI,CAACD,GAAG,CAACc,MAAM,GAAG,CAAC,EAAE;MACvB,MAAM,CAACN,CAAC,EAAEI,EAAE,EAAEC,EAAE,CAAC,GAAG,IAAI,CAACb,GAAG,CAAC,CAAC,CAAE;MAChC,IACEe,IAAI,CAACC,GAAG,CAACR,CAAC,GAAG,IAAI,CAACP,iBAAiB,CAAC,GAAG,CAAC,IACxC,IAAI,CAACH,iBAAiB,CAACgB,MAAM,GAAG,CAAC,EACjC;QACA,MAAMG,EAAE,GAAG,IAAI,CAACnB,iBAAiB,CAACgB,MAAM;QACxC,MAAMI,EAAE,GAAG,IAAI,CAAClB,GAAG,CAACc,MAAM;QAE1B,KAAK,IAAIK,CAAC,GAAG,CAAC,EAAEA,CAAC,IAAIJ,IAAI,CAACK,GAAG,CAACH,EAAE,EAAEC,EAAE,EAAE,CAAC,CAAC,EAAEC,CAAC,EAAE,EAAE;UAC7C,MAAME,CAAC,GAAG,IAAI,CAACvB,iBAAiB,CAC7BwB,KAAK,CAAC,CAACH,CAAC,CAAC,CACTZ,GAAG,CAAEgB,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,GAAG,CAAC;UACZ,MAAMC,IAAI,GAAG,IAAI,CAACzB,GAAG,CAClBsB,KAAK,CAAC,CAAC,EAAEH,CAAC,CAAC,CACXZ,GAAG,CAAEgB,CAAC,IAAKA,CAAC,CAAC,CAAC,CAAC,CAAC,CAChBC,IAAI,CAAC,GAAG,CAAC;UACZ,IAAIH,CAAC,KAAKI,IAAI,EAAE;YACd,KAAK,IAAIC,CAAC,GAAG,CAAC,EAAEA,CAAC,GAAGP,CAAC,EAAEO,CAAC,EAAE,EAAE;cAC1B,IAAI,CAAC1B,GAAG,CAAC2B,KAAK,CAAC,CAAC;YAClB;YACA;UACF;QACF;MACF;IACF;EACF;EAEOC,KAAKA,CAAA,EAAgB;IAC1B,MAAMC,MAAmB,GAAG,EAAE;IAC9B,OAAO,
IAAI,CAAC7B,GAAG,CAACc,MAAM,GAAG,CAAC,IAAI,IAAI,CAACf,MAAM,CAACe,MAAM,GAAG,CAAC,EAAE;MACpD,IAAI,IAAI,CAACd,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC,KAAK,IAAI,CAACD,MAAM,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC,EAAE;QAC1C;MACF;MACA8B,MAAM,CAACC,IAAI,CAAC,IAAI,CAAC9B,GAAG,CAAC,CAAC,CAAE,CAAC;MACzB,IAAI,CAACE,iBAAiB,GAAG,IAAI,CAACF,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;MACxC,IAAI,CAACC,iBAAiB,GAAG,IAAI,CAACD,GAAG,CAAC,CAAC,CAAC,CAAE,CAAC,CAAC;MACxC,IAAI,CAACD,MAAM,CAAC4B,KAAK,CAAC,CAAC;MACnB,IAAI,CAAC3B,GAAG,CAAC2B,KAAK,CAAC,CAAC;IAClB;IACA,IAAI,CAAC5B,MAAM,GAAG,IAAI,CAACC,GAAG;IACtB,IAAI,CAACA,GAAG,GAAG,EAAE;IACb,IAAI,CAACF,iBAAiB,CAACgC,IAAI,CAAC,GAAGD,MAAM,CAAC;IACtC,OAAOA,MAAM;EACf;EAEOE,YAAYA,CAACC,IAAY,EAAE;IAChC,IAAI,CAAClC,iBAAiB,GAAG,IAAI,CAACA,iBAAiB,CAACa,MAAM,CACpD,CAAC,CAACsB,EAAE,EAAExB,CAAC,EAAEI,EAAE,CAAC,KAAKJ,CAAC,GAAGuB,IACvB,CAAC;EACH;EAEOE,QAAQA,CAAA,EAAgB;IAC7B,OAAO,IAAI,CAACnC,MAAM;EACpB;AACF","ignoreList":[]}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { ResourceSource } from '../types/common';
|
|
2
|
+
/**
 * Base class for modules that are used entirely through static members.
 */
export declare class BaseModule {
  /** Native backend whose `loadModule` receives the fetched resource paths. */
  protected static nativeModule: any;

  /** Progress listener handed to the resource fetcher by `load`. */
  static onDownloadProgressCallback: (downloadProgress: number) => void;

  /**
   * Fetches `sources` and loads them into the native module.
   *
   * @param sources Resources to fetch before loading.
   * @param loadArgs Extra arguments appended to the native `loadModule` call.
   */
  static load(sources: ResourceSource[], ...loadArgs: any[]): Promise<void>;

  /**
   * Placeholder that derived classes are expected to implement; the base
   * implementation always rejects.
   */
  protected static forward(..._args: any[]): Promise<any>;

  /**
   * Registers the listener used for download progress reporting.
   *
   * @param callback Receives the download progress value.
   */
  static onDownloadProgress(
    callback: (downloadProgress: number) => void
  ): void;
}
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../utils/ResourceFetcher';
|
|
2
|
+
import { getError } from '../Error';
|
|
3
|
+
/**
 * Base class for modules that are used entirely through static members.
 */
export class BaseModule {
  /** Native backend; expected to be assigned by the derived class. */
  static nativeModule;

  /** Progress listener handed to the resource fetcher; no-op by default. */
  static onDownloadProgressCallback = () => { };

  /**
   * Fetches every source and passes the resulting paths to the native
   * `loadModule`.
   *
   * @param sources Resources to fetch.
   * @param loadArgs Extra arguments derived classes can pass; they are
   *   appended after the fetched paths in the native `loadModule` call.
   * @throws {Error} Any failure (including an incomplete download) is
   *   re-thrown as a new `Error` whose message comes from `getError`.
   */
  static async load(sources, ...loadArgs) {
    try {
      const paths = await ResourceFetcher.fetch(
        this.onDownloadProgressCallback,
        ...sources
      );
      const downloadIncomplete = paths === null || paths.length < sources.length;
      if (downloadIncomplete) {
        throw new Error('Download interrupted.');
      }
      const nativeArgs = [...paths, ...loadArgs];
      await this.nativeModule.loadModule(...nativeArgs);
    } catch (error) {
      throw new Error(getError(error));
    }
  }

  /**
   * Placeholder for the inference entry point; always rejects in the base
   * class.
   */
  static forward(..._args) {
    return Promise.reject(
      new Error('forward method is not implemented in the BaseModule class. Please implement it in the derived class.')
    );
  }

  /**
   * Replaces the download progress listener.
   *
   * @param callback Receives the download progress value.
   */
  static onDownloadProgress(callback) {
    this.onDownloadProgressCallback = callback;
  }
}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
import { ResourceSource } from '../types/common';
|
|
2
|
+
import { TensorPtr } from '../types/common';
|
|
3
|
+
/**
 * Base class for instance-based modules that own a native module handle.
 */
export declare abstract class BaseNonStaticModule {
  /** Handle of the loaded native module; `null` until a model is loaded. */
  nativeModule: any;

  /**
   * Loads a model into `nativeModule`; implemented by each concrete module.
   *
   * @param modelSource Where the model comes from.
   * @param onDownloadProgressCallback Receives download progress updates.
   * @param args Additional module-specific arguments.
   */
  abstract load(
    modelSource: ResourceSource,
    onDownloadProgressCallback: (_: number) => void,
    ...args: any[]
  ): Promise<void>;

  /**
   * Passes the tensors to the native module's `forward`.
   *
   * @param inputTensor Input tensors.
   * @returns Whatever the native `forward` resolves to.
   */
  protected forwardET(inputTensor: TensorPtr[]): Promise<TensorPtr[]>;

  /**
   * Asks the native module for an input shape.
   *
   * @param methodName Name of the method to query.
   * @param index Index of the input.
   */
  getInputShape(methodName: string, index: number): Promise<number[]>;

  /** Unloads the native module if one has been loaded. */
  delete(): void;
}
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
/**
 * Base class for instance-based modules that own a native module handle.
 *
 * Derived classes assign `nativeModule` in their `load` implementation.
 */
export class BaseNonStaticModule {
  /** Handle of the loaded native module; `null` until a model is loaded. */
  nativeModule = null;

  /**
   * Passes the tensors to the native module's `forward`.
   *
   * No "not loaded" guard is applied here: calling this before a model is
   * loaded fails with a TypeError on the missing handle.
   *
   * @param inputTensor Input tensors.
   * @returns Whatever the native `forward` resolves to.
   */
  async forwardET(inputTensor) {
    return await this.nativeModule.forward(inputTensor);
  }

  /**
   * Asks the native module for an input shape.
   *
   * @param methodName Name of the method to query.
   * @param index Index of the input.
   * @returns Whatever the native `getInputShape` returns.
   */
  async getInputShape(methodName, index) {
    return this.nativeModule.getInputShape(methodName, index);
  }

  /**
   * Unloads the native module if one is present.
   *
   * The guard uses `!= null` so that both `null` and `undefined` handles are
   * treated as "nothing to unload", matching the `== null` checks used by the
   * derived modules' `forward` methods.
   */
  delete() {
    if (this.nativeModule != null) {
      this.nativeModule.unload();
    }
  }
}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
3
|
+
/**
 * Image classification module backed by a native classification model.
 */
export declare class ClassificationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native classification module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      modelSource: ResourceSource;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource Image to classify.
   * @returns The result produced by the native module's `generate`.
   */
  forward(imageSource: string): Promise<any>;
}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../../utils/ResourceFetcher';
|
|
2
|
+
import { ETError, getError } from '../../Error';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Image classification module backed by a native classification model.
 */
export class ClassificationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native classification module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   * @throws {Error} 'Download interrupted.' when the fetch yields no path.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const paths = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const nothingFetched = paths === null || paths.length < 1;
    if (nothingFetched) {
      throw new Error('Download interrupted.');
    }
    const modelPath = paths[0] || '';
    this.nativeModule = global.loadClassification(modelPath);
  }

  /**
   * Runs the loaded model on an image.
   *
   * @param imageSource Image to classify.
   * @returns The result of the native module's `generate`.
   * @throws {Error} When no model has been loaded.
   */
  async forward(imageSource) {
    if (this.nativeModule == null) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const result = await this.nativeModule.generate(imageSource);
    return result;
  }
}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
3
|
+
/**
 * Image embeddings module backed by a native embeddings model.
 */
export declare class ImageEmbeddingsModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-embeddings module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      modelSource: ResourceSource;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Computes the embedding of an image.
   *
   * @param imageSource Image to embed.
   * @returns The native result wrapped in a `Float32Array`.
   */
  forward(imageSource: string): Promise<Float32Array>;
}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../../utils/ResourceFetcher';
|
|
2
|
+
import { ETError, getError } from '../../Error';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Image embeddings module backed by a native embeddings model.
 */
export class ImageEmbeddingsModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-embeddings module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   * @throws {Error} 'Download interrupted.' when the fetch yields no path.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const paths = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const nothingFetched = paths === null || paths.length < 1;
    if (nothingFetched) {
      throw new Error('Download interrupted.');
    }
    const modelPath = paths[0] || '';
    this.nativeModule = global.loadImageEmbeddings(modelPath);
  }

  /**
   * Computes the embedding of an image.
   *
   * @param imageSource Image to embed.
   * @returns A `Float32Array` built from the native module's `generate`
   *   result.
   * @throws {Error} When no model has been loaded.
   */
  async forward(imageSource) {
    if (this.nativeModule == null) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const rawEmbedding = await this.nativeModule.generate(imageSource);
    return new Float32Array(rawEmbedding);
  }
}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { DeeplabLabel } from '../../types/imageSegmentation';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Image segmentation module backed by a native segmentation model.
 */
export declare class ImageSegmentationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-segmentation module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      modelSource: ResourceSource;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Segments an image.
   *
   * @param imageSource Image to segment.
   * @param classesOfInterest Labels forwarded to the native module; treated
   *   as an empty list when omitted.
   * @param resize Forwarded to the native module; treated as `false` when
   *   omitted.
   * @returns The native result re-keyed by `DeeplabLabel`; labels absent from
   *   the result are omitted.
   */
  forward(
    imageSource: string,
    classesOfInterest?: DeeplabLabel[],
    resize?: boolean
  ): Promise<Partial<Record<DeeplabLabel, number[]>>>;
}
|
|
@@ -0,0 +1,27 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../../utils/ResourceFetcher';
|
|
2
|
+
import { DeeplabLabel } from '../../types/imageSegmentation';
|
|
3
|
+
import { ETError, getError } from '../../Error';
|
|
4
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
5
|
+
/**
 * Image segmentation module backed by a native segmentation model.
 */
export class ImageSegmentationModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native image-segmentation module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   * @throws {Error} 'Download interrupted.' when the fetch yields no path.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const paths = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const nothingFetched = paths === null || paths.length < 1;
    if (nothingFetched) {
      throw new Error('Download interrupted.');
    }
    const modelPath = paths[0] || '';
    this.nativeModule = global.loadImageSegmentation(modelPath);
  }

  /**
   * Segments an image and re-keys the native result by `DeeplabLabel`.
   *
   * @param imageSource Image to segment.
   * @param classesOfInterest Labels of interest; each is looked up in
   *   `DeeplabLabel` before being sent to the native module. Falsy values are
   *   treated as an empty list.
   * @param resize Forwarded to the native module; falsy values become
   *   `false`.
   * @returns An object containing only those entries of the native result
   *   whose key exists in `DeeplabLabel`, stored under `DeeplabLabel[key]`.
   * @throws {Error} When no model has been loaded.
   */
  async forward(imageSource, classesOfInterest, resize) {
    if (this.nativeModule == null) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }

    const requestedLabels = (classesOfInterest || []).map(
      (label) => DeeplabLabel[label]
    );
    const stringDict = await this.nativeModule.generate(
      imageSource,
      requestedLabels,
      resize || false
    );

    const enumDict = {};
    for (const key in stringDict) {
      // Skip anything the native side returned that is not a known label.
      if (!(key in DeeplabLabel)) {
        continue;
      }
      enumDict[DeeplabLabel[key]] = stringDict[key];
    }
    return enumDict;
  }
}
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { OCRLanguage } from '../../types/ocr';
|
|
3
|
+
/**
 * OCR module; a thin facade over an internal controller.
 */
export declare class OCRModule {
  /** Controller that performs loading, inference and cleanup. */
  private controller;

  constructor();

  /**
   * Loads the detector and the three recognizers through the controller.
   *
   * @param model Sources of the detector and the large/medium/small
   *   recognizers, plus the OCR language.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      detectorSource: ResourceSource;
      recognizerLarge: ResourceSource;
      recognizerMedium: ResourceSource;
      recognizerSmall: ResourceSource;
      language: OCRLanguage;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs OCR on the input through the controller.
   *
   * @param input Input passed unchanged to the controller's `forward`.
   * @returns Whatever the controller's `forward` resolves to.
   */
  forward(input: string): Promise<any>;

  /** Delegates cleanup to the controller's `delete`. */
  delete(): void;
}
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
import { OCRController } from '../../controllers/OCRController';
|
|
2
|
+
/**
 * OCR module; a thin facade over `OCRController`.
 */
export class OCRModule {
  /** Controller that performs loading, inference and cleanup. */
  controller;

  constructor() {
    this.controller = new OCRController();
  }

  /**
   * Loads the detector and the three recognizers through the controller.
   *
   * @param model Sources of the detector and the large/medium/small
   *   recognizers, plus the OCR language.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const {
      detectorSource,
      recognizerLarge,
      recognizerMedium,
      recognizerSmall,
      language,
    } = model;
    const recognizerSources = {
      recognizerLarge,
      recognizerMedium,
      recognizerSmall,
    };
    await this.controller.load(
      detectorSource,
      recognizerSources,
      language,
      onDownloadProgressCallback
    );
  }

  /**
   * Runs OCR on the input through the controller.
   *
   * @param input Input passed unchanged to the controller's `forward`.
   * @returns Whatever the controller's `forward` resolves to.
   */
  async forward(input) {
    const result = await this.controller.forward(input);
    return result;
  }

  /** Delegates cleanup to the controller's `delete`. */
  delete() {
    this.controller.delete();
  }
}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { Detection } from '../../types/objectDetection';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Object detection module backed by a native detection model.
 */
export declare class ObjectDetectionModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native object-detection module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      modelSource: ResourceSource;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Detects objects in an image.
   *
   * @param imageSource Image to analyse.
   * @param detectionThreshold Threshold forwarded to the native module;
   *   defaults to 0.7 in the implementation.
   * @returns The detections produced by the native module.
   */
  forward(
    imageSource: string,
    detectionThreshold?: number
  ): Promise<Detection[]>;
}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../../utils/ResourceFetcher';
|
|
2
|
+
import { ETError, getError } from '../../Error';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Object detection module backed by a native detection model.
 */
export class ObjectDetectionModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native object-detection module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   * @throws {Error} 'Download interrupted.' when the fetch yields no path.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const paths = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const nothingFetched = paths === null || paths.length < 1;
    if (nothingFetched) {
      throw new Error('Download interrupted.');
    }
    const modelPath = paths[0] || '';
    this.nativeModule = global.loadObjectDetection(modelPath);
  }

  /**
   * Detects objects in an image.
   *
   * @param imageSource Image to analyse.
   * @param detectionThreshold Threshold forwarded to the native module
   *   (default 0.7).
   * @returns The result of the native module's `generate`.
   * @throws {Error} When no model has been loaded.
   */
  async forward(imageSource, detectionThreshold = 0.7) {
    if (this.nativeModule == null) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const detections = await this.nativeModule.generate(
      imageSource,
      detectionThreshold
    );
    return detections;
  }
}
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
3
|
+
/**
 * Style transfer module backed by a native style-transfer model.
 */
export declare class StyleTransferModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native style-transfer module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      modelSource: ResourceSource;
    },
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Applies the loaded style model to an image.
   *
   * @param imageSource Image to stylize.
   * @returns The string produced by the native module's `generate`.
   */
  forward(imageSource: string): Promise<string>;
}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
import { ResourceFetcher } from '../../utils/ResourceFetcher';
|
|
2
|
+
import { ETError, getError } from '../../Error';
|
|
3
|
+
import { BaseNonStaticModule } from '../BaseNonStaticModule';
|
|
4
|
+
/**
 * Style transfer module backed by a native style-transfer model.
 */
export class StyleTransferModule extends BaseNonStaticModule {
  /**
   * Fetches the model and creates the native style-transfer module.
   *
   * @param model Object holding the model's `modelSource`.
   * @param onDownloadProgressCallback Download progress listener; no-op by
   *   default.
   * @throws {Error} 'Download interrupted.' when the fetch yields no path.
   */
  async load(model, onDownloadProgressCallback = () => { }) {
    const paths = await ResourceFetcher.fetch(
      onDownloadProgressCallback,
      model.modelSource
    );
    const nothingFetched = paths === null || paths.length < 1;
    if (nothingFetched) {
      throw new Error('Download interrupted.');
    }
    const modelPath = paths[0] || '';
    this.nativeModule = global.loadStyleTransfer(modelPath);
  }

  /**
   * Applies the loaded style model to an image.
   *
   * @param imageSource Image to stylize.
   * @returns The result of the native module's `generate`.
   * @throws {Error} When no model has been loaded.
   */
  async forward(imageSource) {
    if (this.nativeModule == null) {
      throw new Error(getError(ETError.ModuleNotLoaded));
    }
    const stylized = await this.nativeModule.generate(imageSource);
    return stylized;
  }
}
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
import { ResourceSource } from '../../types/common';
|
|
2
|
+
import { OCRLanguage } from '../../types/ocr';
|
|
3
|
+
/**
 * Vertical OCR module.
 *
 * NOTE(review): the implementation is not visible from this declaration;
 * presumably it delegates to a controller the same way `OCRModule` does -
 * confirm against the implementation.
 */
export declare class VerticalOCRModule {
  /** Internal controller instance. */
  private controller;

  constructor();

  /**
   * Loads the detectors and recognizers.
   *
   * @param model Sources of the large/narrow detectors and the large/small
   *   recognizers, plus the OCR language.
   * @param independentCharacters Required flag; its exact effect is defined
   *   by the implementation (TODO confirm).
   * @param onDownloadProgressCallback Optional download progress listener.
   */
  load(
    model: {
      detectorLarge: ResourceSource;
      detectorNarrow: ResourceSource;
      recognizerLarge: ResourceSource;
      recognizerSmall: ResourceSource;
      language: OCRLanguage;
    },
    independentCharacters: boolean,
    onDownloadProgressCallback?: (progress: number) => void
  ): Promise<void>;

  /**
   * Runs OCR on the input.
   *
   * @param input Input to process.
   */
  forward(input: string): Promise<any>;

  /** Releases the module's resources. */
  delete(): void;
}
|