sherpa-onnx-node 1.12.28 → 1.12.30
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/addon.js +2 -2
- package/online-speech-denoiser.js +45 -0
- package/package.json +7 -7
- package/sherpa-onnx.js +2 -0
- package/types.js +58 -29
package/addon.js
CHANGED
|
@@ -51,7 +51,7 @@ if (!addon) {
|
|
|
51
51
|
!process.env.DYLD_LIBRARY_PATH.includes(
|
|
52
52
|
`node_modules/sherpa-onnx-${platform_arch}`))) {
|
|
53
53
|
msg +=
|
|
54
|
-
'Please
|
|
54
|
+
'Please remember to set the following environment variable and try again:\n';
|
|
55
55
|
|
|
56
56
|
msg += `export DYLD_LIBRARY_PATH=${addon_path}`;
|
|
57
57
|
|
|
@@ -63,7 +63,7 @@ if (!addon) {
|
|
|
63
63
|
!process.env.LD_LIBRARY_PATH.includes(
|
|
64
64
|
`node_modules/sherpa-onnx-${platform_arch}`))) {
|
|
65
65
|
msg +=
|
|
66
|
-
'Please
|
|
66
|
+
'Please remember to set the following environment variable and try again:\n';
|
|
67
67
|
|
|
68
68
|
msg += `export LD_LIBRARY_PATH=${addon_path}`;
|
|
69
69
|
|
|
@@ -0,0 +1,45 @@
|
|
|
1
|
+
/** @typedef {import('./types').OnlineSpeechDenoiserConfig} OnlineSpeechDenoiserConfig */
|
|
2
|
+
/** @typedef {import('./types').GeneratedAudio} GeneratedAudio */
|
|
3
|
+
/** @typedef {import('./types').AudioProcessRequest} AudioProcessRequest */
|
|
4
|
+
|
|
5
|
+
const addon = require('./addon.js');
|
|
6
|
+
|
|
7
|
+
class OnlineSpeechDenoiser {
|
|
8
|
+
/**
|
|
9
|
+
* @param {OnlineSpeechDenoiserConfig} config
|
|
10
|
+
*/
|
|
11
|
+
constructor(config) {
|
|
12
|
+
this.handle = addon.createOnlineSpeechDenoiser(config);
|
|
13
|
+
this.config = config;
|
|
14
|
+
|
|
15
|
+
this.sampleRate =
|
|
16
|
+
addon.onlineSpeechDenoiserGetSampleRateWrapper(this.handle);
|
|
17
|
+
this.frameShiftInSamples =
|
|
18
|
+
addon.onlineSpeechDenoiserGetFrameShiftInSamplesWrapper(this.handle);
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
/**
|
|
22
|
+
* @param {AudioProcessRequest} obj
|
|
23
|
+
* @returns {GeneratedAudio}
|
|
24
|
+
*/
|
|
25
|
+
run(obj) {
|
|
26
|
+
return addon.onlineSpeechDenoiserRunWrapper(this.handle, obj);
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
/**
|
|
30
|
+
* @param {boolean} [enableExternalBuffer=true]
|
|
31
|
+
* @returns {GeneratedAudio}
|
|
32
|
+
*/
|
|
33
|
+
flush(enableExternalBuffer = true) {
|
|
34
|
+
return addon.onlineSpeechDenoiserFlushWrapper(
|
|
35
|
+
this.handle, enableExternalBuffer);
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
reset() {
|
|
39
|
+
addon.onlineSpeechDenoiserResetWrapper(this.handle);
|
|
40
|
+
}
|
|
41
|
+
}
|
|
42
|
+
|
|
43
|
+
module.exports = {
|
|
44
|
+
OnlineSpeechDenoiser,
|
|
45
|
+
};
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "sherpa-onnx-node",
|
|
3
|
-
"version": "1.12.28",
|
|
3
|
+
"version": "1.12.30",
|
|
4
4
|
"description": "Speech-to-text, text-to-speech, speaker diarization, and speech enhancement using Next-gen Kaldi without internet connection",
|
|
5
5
|
"main": "sherpa-onnx.js",
|
|
6
6
|
"scripts": {
|
|
@@ -57,11 +57,11 @@
|
|
|
57
57
|
},
|
|
58
58
|
"homepage": "https://github.com/csukuangfj/sherpa-onnx#readme",
|
|
59
59
|
"optionalDependencies": {
|
|
60
|
-
"sherpa-onnx-darwin-arm64": "^1.12.28",
|
|
61
|
-
"sherpa-onnx-darwin-x64": "^1.12.28",
|
|
62
|
-
"sherpa-onnx-linux-x64": "^1.12.28",
|
|
63
|
-
"sherpa-onnx-linux-arm64": "^1.12.28",
|
|
64
|
-
"sherpa-onnx-win-x64": "^1.12.28",
|
|
65
|
-
"sherpa-onnx-win-ia32": "^1.12.28"
|
|
60
|
+
"sherpa-onnx-darwin-arm64": "^1.12.30",
|
|
61
|
+
"sherpa-onnx-darwin-x64": "^1.12.30",
|
|
62
|
+
"sherpa-onnx-linux-x64": "^1.12.30",
|
|
63
|
+
"sherpa-onnx-linux-arm64": "^1.12.30",
|
|
64
|
+
"sherpa-onnx-win-x64": "^1.12.30",
|
|
65
|
+
"sherpa-onnx-win-ia32": "^1.12.30"
|
|
66
66
|
}
|
|
67
67
|
}
|
package/sherpa-onnx.js
CHANGED
|
@@ -18,6 +18,7 @@ const punct = require('./punctuation.js');
|
|
|
18
18
|
const kws = require('./keyword-spotter.js');
|
|
19
19
|
const sd = require('./non-streaming-speaker-diarization.js');
|
|
20
20
|
const speech_denoiser = require('./non-streaming-speech-denoiser.js');
|
|
21
|
+
const online_speech_denoiser = require('./online-speech-denoiser.js');
|
|
21
22
|
|
|
22
23
|
module.exports = {
|
|
23
24
|
OnlineRecognizer : streaming_asr.OnlineRecognizer,
|
|
@@ -38,6 +39,7 @@ module.exports = {
|
|
|
38
39
|
KeywordSpotter : kws.KeywordSpotter,
|
|
39
40
|
OfflineSpeakerDiarization : sd.OfflineSpeakerDiarization,
|
|
40
41
|
OfflineSpeechDenoiser : speech_denoiser.OfflineSpeechDenoiser,
|
|
42
|
+
OnlineSpeechDenoiser : online_speech_denoiser.OnlineSpeechDenoiser,
|
|
41
43
|
version : addon.version,
|
|
42
44
|
gitSha1 : addon.gitSha1,
|
|
43
45
|
gitDate : addon.gitDate,
|
package/types.js
CHANGED
|
@@ -52,7 +52,7 @@
|
|
|
52
52
|
|
|
53
53
|
/**
|
|
54
54
|
* @typedef {Object} OfflinePunctuationHandle
|
|
55
|
-
* @see src/punctuation.cc
|
|
55
|
+
* @see src/offline-punctuation.cc
|
|
56
56
|
*/
|
|
57
57
|
|
|
58
58
|
/**
|
|
@@ -501,10 +501,24 @@
|
|
|
501
501
|
* @property {number} [lengthScale]
|
|
502
502
|
*/
|
|
503
503
|
|
|
504
|
-
/**
|
|
505
|
-
* @typedef {Object}
|
|
506
|
-
* @property {string} [
|
|
507
|
-
* @property {string} [
|
|
504
|
+
/**
|
|
505
|
+
* @typedef {Object} OfflineTtsZipvoiceModelConfig
|
|
506
|
+
* @property {string} [tokens]
|
|
507
|
+
* @property {string} [encoder]
|
|
508
|
+
* @property {string} [decoder]
|
|
509
|
+
* @property {string} [vocoder]
|
|
510
|
+
* @property {string} [dataDir]
|
|
511
|
+
* @property {string} [lexicon]
|
|
512
|
+
* @property {number} [featScale]
|
|
513
|
+
* @property {number} [tShift]
|
|
514
|
+
* @property {number} [targetRms]
|
|
515
|
+
* @property {number} [guidanceScale]
|
|
516
|
+
*/
|
|
517
|
+
|
|
518
|
+
/**
|
|
519
|
+
* @typedef {Object} OfflineTtsPocketModelConfig
|
|
520
|
+
* @property {string} [lmFlow]
|
|
521
|
+
* @property {string} [lmMain]
|
|
508
522
|
* @property {string} [encoder]
|
|
509
523
|
* @property {string} [decoder]
|
|
510
524
|
* @property {string} [textConditioner]
|
|
@@ -517,11 +531,12 @@
|
|
|
517
531
|
* Offline TTS model config
|
|
518
532
|
* @typedef {Object} OfflineTtsModelConfig
|
|
519
533
|
* @property {OfflineTtsVitsModelConfig} [vits]
|
|
520
|
-
* @property {OfflineTtsMatchaModelConfig} [matcha]
|
|
521
|
-
* @property {OfflineTtsKokoroModelConfig} [kokoro]
|
|
522
|
-
* @property {OfflineTtsKittenModelConfig} [kitten]
|
|
523
|
-
* @property {
|
|
524
|
-
|
|
534
|
+
* @property {OfflineTtsMatchaModelConfig} [matcha]
|
|
535
|
+
* @property {OfflineTtsKokoroModelConfig} [kokoro]
|
|
536
|
+
* @property {OfflineTtsKittenModelConfig} [kitten]
|
|
537
|
+
* @property {OfflineTtsZipvoiceModelConfig} [zipvoice]
|
|
538
|
+
* @property {OfflineTtsPocketModelConfig} [pocket]
|
|
539
|
+
*/
|
|
525
540
|
|
|
526
541
|
/**
|
|
527
542
|
* Offline TTS configuration (partial, commonly used props).
|
|
@@ -533,25 +548,39 @@
|
|
|
533
548
|
* @property {string} [provider]
|
|
534
549
|
*/
|
|
535
550
|
|
|
536
|
-
/**
|
|
537
|
-
* Offline Speech Denoiser model config
|
|
538
|
-
* @typedef {Object} OfflineSpeechDenoiserGtcrnModelConfig
|
|
539
|
-
* @property {string} [model]
|
|
540
|
-
*/
|
|
541
|
-
|
|
542
|
-
/**
|
|
543
|
-
* Offline Speech Denoiser model config
|
|
544
|
-
* @typedef {Object}
|
|
545
|
-
* @property {
|
|
546
|
-
*/
|
|
547
|
-
|
|
548
|
-
/**
|
|
549
|
-
* Offline Speech Denoiser
|
|
550
|
-
* @typedef {Object}
|
|
551
|
-
* @property {
|
|
552
|
-
* @property {
|
|
553
|
-
* @property {
|
|
554
|
-
|
|
551
|
+
/**
|
|
552
|
+
* Offline Speech Denoiser model config
|
|
553
|
+
* @typedef {Object} OfflineSpeechDenoiserGtcrnModelConfig
|
|
554
|
+
* @property {string} [model]
|
|
555
|
+
*/
|
|
556
|
+
|
|
557
|
+
/**
|
|
558
|
+
* Offline Speech Denoiser model config
|
|
559
|
+
* @typedef {Object} OfflineSpeechDenoiserDpdfNetModelConfig
|
|
560
|
+
* @property {string} [model]
|
|
561
|
+
*/
|
|
562
|
+
|
|
563
|
+
/**
|
|
564
|
+
* Offline Speech Denoiser model config
|
|
565
|
+
* @typedef {Object} OfflineSpeechDenoiserModelConfig
|
|
566
|
+
* @property {OfflineSpeechDenoiserGtcrnModelConfig} [gtcrn]
|
|
567
|
+
* @property {OfflineSpeechDenoiserDpdfNetModelConfig} [dpdfnet]
|
|
568
|
+
* @property {number} [numThreads]
|
|
569
|
+
* @property {boolean|number} [debug]
|
|
570
|
+
* @property {string} [provider]
|
|
571
|
+
*/
|
|
572
|
+
|
|
573
|
+
/**
|
|
574
|
+
* Offline Speech Denoiser configuration (partial).
|
|
575
|
+
* @typedef {Object} OfflineSpeechDenoiserConfig
|
|
576
|
+
* @property {OfflineSpeechDenoiserModelConfig} [model]
|
|
577
|
+
*/
|
|
578
|
+
|
|
579
|
+
/**
|
|
580
|
+
* Online Speech Denoiser configuration (partial).
|
|
581
|
+
* @typedef {Object} OnlineSpeechDenoiserConfig
|
|
582
|
+
* @property {OfflineSpeechDenoiserModelConfig} [model]
|
|
583
|
+
*/
|
|
555
584
|
|
|
556
585
|
/**
|
|
557
586
|
* Offline speaker segmentation (pyannote) model config
|