npm - @layercode/js-sdk - Versions diffs - 1.0.15 → 1.0.17 - Mend

@layercode/js-sdk 1.0.15 → 1.0.17

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

package/dist/layercode-js-sdk.esm.js +69 -22
package/dist/layercode-js-sdk.esm.js.map +1 -1
package/dist/layercode-js-sdk.min.js +69 -22
package/dist/layercode-js-sdk.min.js.map +1 -1
package/dist/types/index.d.ts +1 -0
package/dist/types/interfaces.d.ts +6 -2
package/package.json +3 -2

package/dist/layercode-js-sdk.min.js CHANGED Viewed

@@ -3506,13 +3506,58 @@ registerProcessor('audio_processor', AudioProcessor);
           this.vadPausedPlayer = false;
           this.pushToTalkEnabled = false;
           this.canInterrupt = false;
+          this.userIsSpeaking = false;
           // Bind event handlers
           this._handleWebSocketMessage = this._handleWebSocketMessage.bind(this);
           this._handleDataAvailable = this._handleDataAvailable.bind(this);
       }
       _initializeVAD() {
           console.log('initializing VAD', { pushToTalkEnabled: this.pushToTalkEnabled, canInterrupt: this.canInterrupt });
-          if (!this.pushToTalkEnabled && this.canInterrupt) {
+          // If we're in push to talk mode, we don't need to use the VAD model
+          if (this.pushToTalkEnabled) {
+              return;
+          }
+          const timeout = setTimeout(() => {
+              console.log('silero vad model timeout');
+              // TODO: send message to server to indicate that the vad model timed out
+              this.userIsSpeaking = true; // allow audio to be sent to the server
+          }, 2000);
+          if (!this.canInterrupt) {
+              dist.MicVAD.new({
+                  stream: this.wavRecorder.getStream() || undefined,
+                  model: 'v5',
+                  positiveSpeechThreshold: 0.3,
+                  negativeSpeechThreshold: 0.2,
+                  redemptionFrames: 25, // Number of frames of silence before onVADMisfire or onSpeechEnd is called. Effectively a delay before restarting.
+                  minSpeechFrames: 15,
+                  preSpeechPadFrames: 0,
+                  onSpeechStart: () => {
+                      if (!this.wavPlayer.isPlaying) {
+                          this.userIsSpeaking = true;
+                      }
+                  },
+                  onVADMisfire: () => {
+                      this.userIsSpeaking = false;
+                  },
+                  onSpeechEnd: () => {
+                      this.userIsSpeaking = false;
+                      this._wsSend({
+                          type: 'vad_events',
+                          event: 'vad_end',
+                      });
+                  },
+              })
+                  .then((vad) => {
+                  clearTimeout(timeout);
+                  this.vad = vad;
+                  this.vad.start();
+                  console.log('VAD started');
+              })
+                  .catch((error) => {
+                  console.error('Error initializing VAD:', error);
+              });
+          }
+          else {
               dist.MicVAD.new({
                   stream: this.wavRecorder.getStream() || undefined,
                   model: 'v5',
@@ -3533,36 +3578,35 @@ registerProcessor('audio_processor', AudioProcessor);
                       else {
                           console.log('onSpeechStart: WavPlayer is not playing, VAD will not pause.');
                       }
+                      this.userIsSpeaking = true;
+                      console.log('onSpeechStart: sending vad_start');
+                      this._wsSend({
+                          type: 'vad_events',
+                          event: 'vad_start',
+                      });
                   },
                   onVADMisfire: () => {
                       // If the speech detected was for less than minSpeechFrames, this is called instead of onSpeechEnd, and we should resume the assistant audio as it was a false interruption. We include a configurable delay so the assistant isn't too quick to start speaking again.
+                      this.userIsSpeaking = false;
                       if (this.vadPausedPlayer) {
                           console.log('onSpeechEnd: VAD paused the player, resuming');
                           this.wavPlayer.play();
                           this.vadPausedPlayer = false; // Reset flag
-                          // Option to extend delay in the case where the transcriber takes longer to detect a new turn
-                          // console.log('onVADMisfire: VAD paused the player, resuming in ' + this.options.vadResumeDelay + 'ms');
-                          // // Add configurable delay before resuming playback
-                          // setTimeout(() => {
-                          //   this.wavPlayer.play();
-                          //   this.vadPausedPlayer = false; // Reset flag
-                          // }, this.options.vadResumeDelay);
                       }
                       else {
                           console.log('onVADMisfire: VAD did not pause the player, no action taken to resume.');
                       }
                   },
-                  // onSpeechEnd: () => {
-                  //   if (this.vadPausedPlayer) {
-                  //     console.log('onSpeechEnd: VAD paused the player, resuming');
-                  //     this.wavPlayer.play();
-                  //     this.vadPausedPlayer = false; // Reset flag
-                  //   } else {
-                  //     console.log('onSpeechEnd: VAD did not pause the player, not resuming.');
-                  //   }
-                  // },
+                  onSpeechEnd: () => {
+                      this.userIsSpeaking = false;
+                      this._wsSend({
+                          type: 'vad_events',
+                          event: 'vad_end',
+                      });
+                  },
               })
                   .then((vad) => {
+                  clearTimeout(timeout);
                   this.vad = vad;
                   this.vad.start();
                   console.log('VAD started');
@@ -3670,10 +3714,13 @@ registerProcessor('audio_processor', AudioProcessor);
       _handleDataAvailable(data) {
           try {
               const base64 = arrayBufferToBase64(data.mono);
-              this._wsSend({
-                  type: 'client.audio',
-                  content: base64,
-              });
+              const sendAudio = this.pushToTalkEnabled ? this.pushToTalkActive : this.userIsSpeaking;
+              if (sendAudio) {
+                  this._wsSend({
+                      type: 'client.audio',
+                      content: base64,
+                  });
+              }
           }
           catch (error) {
               console.error('Error processing audio:', error);
@@ -3778,7 +3825,7 @@ registerProcessor('audio_processor', AudioProcessor);
               };
               // Initialize microphone audio capture
               await this.wavRecorder.begin();
-              await this.wavRecorder.record(this._handleDataAvailable);
+              await this.wavRecorder.record(this._handleDataAvailable, 1638);
               // Set up microphone amplitude monitoring
               this._setupAmplitudeMonitoring(this.wavRecorder, this.options.onUserAmplitudeChange, (amp) => (this.userAudioAmplitude = amp));
               // Initialize audio player