sherpa-onnx-node 1.12.28 → 1.12.30

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/addon.js CHANGED
@@ -51,7 +51,7 @@ if (!addon) {
51
51
  !process.env.DYLD_LIBRARY_PATH.includes(
52
52
  `node_modules/sherpa-onnx-${platform_arch}`))) {
53
53
  msg +=
54
- 'Please remeber to set the following environment variable and try again:\n';
54
+ 'Please remember to set the following environment variable and try again:\n';
55
55
 
56
56
  msg += `export DYLD_LIBRARY_PATH=${addon_path}`;
57
57
 
@@ -63,7 +63,7 @@ if (!addon) {
63
63
  !process.env.LD_LIBRARY_PATH.includes(
64
64
  `node_modules/sherpa-onnx-${platform_arch}`))) {
65
65
  msg +=
66
- 'Please remeber to set the following environment variable and try again:\n';
66
+ 'Please remember to set the following environment variable and try again:\n';
67
67
 
68
68
  msg += `export LD_LIBRARY_PATH=${addon_path}`;
69
69
 
package/online-speech-denoiser.js ADDED
@@ -0,0 +1,45 @@
1
+ /** @typedef {import('./types').OnlineSpeechDenoiserConfig} OnlineSpeechDenoiserConfig */
2
+ /** @typedef {import('./types').GeneratedAudio} GeneratedAudio */
3
+ /** @typedef {import('./types').AudioProcessRequest} AudioProcessRequest */
4
+
5
+ const addon = require('./addon.js');
6
+
7
+ class OnlineSpeechDenoiser {
8
+ /**
9
+ * @param {OnlineSpeechDenoiserConfig} config
10
+ */
11
+ constructor(config) {
12
+ this.handle = addon.createOnlineSpeechDenoiser(config);
13
+ this.config = config;
14
+
15
+ this.sampleRate =
16
+ addon.onlineSpeechDenoiserGetSampleRateWrapper(this.handle);
17
+ this.frameShiftInSamples =
18
+ addon.onlineSpeechDenoiserGetFrameShiftInSamplesWrapper(this.handle);
19
+ }
20
+
21
+ /**
22
+ * @param {AudioProcessRequest} obj
23
+ * @returns {GeneratedAudio}
24
+ */
25
+ run(obj) {
26
+ return addon.onlineSpeechDenoiserRunWrapper(this.handle, obj);
27
+ }
28
+
29
+ /**
30
+ * @param {boolean} [enableExternalBuffer=true]
31
+ * @returns {GeneratedAudio}
32
+ */
33
+ flush(enableExternalBuffer = true) {
34
+ return addon.onlineSpeechDenoiserFlushWrapper(
35
+ this.handle, enableExternalBuffer);
36
+ }
37
+
38
+ reset() {
39
+ addon.onlineSpeechDenoiserResetWrapper(this.handle);
40
+ }
41
+ }
42
+
43
+ module.exports = {
44
+ OnlineSpeechDenoiser,
45
+ };
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "sherpa-onnx-node",
3
- "version": "1.12.28",
3
+ "version": "1.12.30",
4
4
  "description": "Speech-to-text, text-to-speech, speaker diarization, and speech enhancement using Next-gen Kaldi without internet connection",
5
5
  "main": "sherpa-onnx.js",
6
6
  "scripts": {
@@ -57,11 +57,11 @@
57
57
  },
58
58
  "homepage": "https://github.com/csukuangfj/sherpa-onnx#readme",
59
59
  "optionalDependencies": {
60
- "sherpa-onnx-darwin-arm64": "^1.12.28",
61
- "sherpa-onnx-darwin-x64": "^1.12.28",
62
- "sherpa-onnx-linux-x64": "^1.12.28",
63
- "sherpa-onnx-linux-arm64": "^1.12.28",
64
- "sherpa-onnx-win-x64": "^1.12.28",
65
- "sherpa-onnx-win-ia32": "^1.12.28"
60
+ "sherpa-onnx-darwin-arm64": "^1.12.30",
61
+ "sherpa-onnx-darwin-x64": "^1.12.30",
62
+ "sherpa-onnx-linux-x64": "^1.12.30",
63
+ "sherpa-onnx-linux-arm64": "^1.12.30",
64
+ "sherpa-onnx-win-x64": "^1.12.30",
65
+ "sherpa-onnx-win-ia32": "^1.12.30"
66
66
  }
67
67
  }
package/sherpa-onnx.js CHANGED
@@ -18,6 +18,7 @@ const punct = require('./punctuation.js');
18
18
  const kws = require('./keyword-spotter.js');
19
19
  const sd = require('./non-streaming-speaker-diarization.js');
20
20
  const speech_denoiser = require('./non-streaming-speech-denoiser.js');
21
+ const online_speech_denoiser = require('./online-speech-denoiser.js');
21
22
 
22
23
  module.exports = {
23
24
  OnlineRecognizer : streaming_asr.OnlineRecognizer,
@@ -38,6 +39,7 @@ module.exports = {
38
39
  KeywordSpotter : kws.KeywordSpotter,
39
40
  OfflineSpeakerDiarization : sd.OfflineSpeakerDiarization,
40
41
  OfflineSpeechDenoiser : speech_denoiser.OfflineSpeechDenoiser,
42
+ OnlineSpeechDenoiser : online_speech_denoiser.OnlineSpeechDenoiser,
41
43
  version : addon.version,
42
44
  gitSha1 : addon.gitSha1,
43
45
  gitDate : addon.gitDate,
package/types.js CHANGED
@@ -52,7 +52,7 @@
52
52
 
53
53
  /**
54
54
  * @typedef {Object} OfflinePunctuationHandle
55
- * @see src/punctuation.cc
55
+ * @see src/offline-punctuation.cc
56
56
  */
57
57
 
58
58
  /**
@@ -501,10 +501,24 @@
501
501
  * @property {number} [lengthScale]
502
502
  */
503
503
 
504
- /**
505
- * @typedef {Object} OfflineTtsPocketModelConfig
506
- * @property {string} [lmFlow]
507
- * @property {string} [lmMain]
504
+ /**
505
+ * @typedef {Object} OfflineTtsZipvoiceModelConfig
506
+ * @property {string} [tokens]
507
+ * @property {string} [encoder]
508
+ * @property {string} [decoder]
509
+ * @property {string} [vocoder]
510
+ * @property {string} [dataDir]
511
+ * @property {string} [lexicon]
512
+ * @property {number} [featScale]
513
+ * @property {number} [tShift]
514
+ * @property {number} [targetRms]
515
+ * @property {number} [guidanceScale]
516
+ */
517
+
518
+ /**
519
+ * @typedef {Object} OfflineTtsPocketModelConfig
520
+ * @property {string} [lmFlow]
521
+ * @property {string} [lmMain]
508
522
  * @property {string} [encoder]
509
523
  * @property {string} [decoder]
510
524
  * @property {string} [textConditioner]
@@ -517,11 +531,12 @@
517
531
  * Offline TTS model config
518
532
  * @typedef {Object} OfflineTtsModelConfig
519
533
  * @property {OfflineTtsVitsModelConfig} [vits]
520
- * @property {OfflineTtsMatchaModelConfig} [matcha]
521
- * @property {OfflineTtsKokoroModelConfig} [kokoro]
522
- * @property {OfflineTtsKittenModelConfig} [kitten]
523
- * @property {OfflineTtsPocketModelConfig} [pocket]
524
- */
534
+ * @property {OfflineTtsMatchaModelConfig} [matcha]
535
+ * @property {OfflineTtsKokoroModelConfig} [kokoro]
536
+ * @property {OfflineTtsKittenModelConfig} [kitten]
537
+ * @property {OfflineTtsZipvoiceModelConfig} [zipvoice]
538
+ * @property {OfflineTtsPocketModelConfig} [pocket]
539
+ */
525
540
 
526
541
  /**
527
542
  * Offline TTS configuration (partial, commonly used props).
@@ -533,25 +548,39 @@
533
548
  * @property {string} [provider]
534
549
  */
535
550
 
536
- /**
537
- * Offline Speech Denoiser model config
538
- * @typedef {Object} OfflineSpeechDenoiserGtcrnModelConfig
539
- * @property {string} [model]
540
- */
541
-
542
- /**
543
- * Offline Speech Denoiser model config
544
- * @typedef {Object} OfflineSpeechDenoiserModelConfig
545
- * @property {OfflineSpeechDenoiserGtcrnModelConfig} [gtcrn]
546
- */
547
-
548
- /**
549
- * Offline Speech Denoiser configuration (partial).
550
- * @typedef {Object} OfflineSpeechDenoiserConfig
551
- * @property {OfflineSpeechDenoiserModelConfig} [model]
552
- * @property {number} [numThreads]
553
- * @property {string} [provider]
554
- */
551
+ /**
552
+ * Offline Speech Denoiser model config
553
+ * @typedef {Object} OfflineSpeechDenoiserGtcrnModelConfig
554
+ * @property {string} [model]
555
+ */
556
+
557
+ /**
558
+ * Offline Speech Denoiser model config
559
+ * @typedef {Object} OfflineSpeechDenoiserDpdfNetModelConfig
560
+ * @property {string} [model]
561
+ */
562
+
563
+ /**
564
+ * Offline Speech Denoiser model config
565
+ * @typedef {Object} OfflineSpeechDenoiserModelConfig
566
+ * @property {OfflineSpeechDenoiserGtcrnModelConfig} [gtcrn]
567
+ * @property {OfflineSpeechDenoiserDpdfNetModelConfig} [dpdfnet]
568
+ * @property {number} [numThreads]
569
+ * @property {boolean|number} [debug]
570
+ * @property {string} [provider]
571
+ */
572
+
573
+ /**
574
+ * Offline Speech Denoiser configuration (partial).
575
+ * @typedef {Object} OfflineSpeechDenoiserConfig
576
+ * @property {OfflineSpeechDenoiserModelConfig} [model]
577
+ */
578
+
579
+ /**
580
+ * Online Speech Denoiser configuration (partial).
581
+ * @typedef {Object} OnlineSpeechDenoiserConfig
582
+ * @property {OfflineSpeechDenoiserModelConfig} [model]
583
+ */
555
584
 
556
585
  /**
557
586
  * Offline speaker segmentation (pyannote) model config