npm - @volley/recognition-client-sdk - Versions diffs - 0.1.767 → 0.1.782 - Mend

@volley/recognition-client-sdk 0.1.767 → 0.1.782

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (13)

package/README.md +4 -1
package/dist/browser.bundled.d.ts +196 -119
package/dist/index.bundled.d.ts +204 -121
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +41 -3
package/dist/index.js.map +3 -3
package/dist/recog-client-sdk.browser.js +40 -3
package/dist/recog-client-sdk.browser.js.map +3 -3
package/dist/recognition-client.d.ts.map +1 -1
package/package.json +3 -3
package/src/index.ts +1 -0
package/src/recognition-client.ts +6 -0

package/dist/recog-client-sdk.browser.js CHANGED

@@ -3749,6 +3749,7 @@ var RecognitionProvider;
   RecognitionProvider2["BEDROCK"] = "bedrock";
   RecognitionProvider2["INWORLD_STT"] = "inworld-stt";
   RecognitionProvider2["AWS_TRANSCRIBE"] = "aws-transcribe";
+  RecognitionProvider2["AMAZON_NOVA_SONIC"] = "amazon-nova-sonic";
   RecognitionProvider2["TEST_ASR_PROVIDER_QUOTA"] = "test-asr-provider-quota";
   RecognitionProvider2["TEST_ASR_STREAMING"] = "test-asr-streaming";
 })(RecognitionProvider || (RecognitionProvider = {}));
@@ -3799,6 +3800,7 @@ var ElevenLabsModel;
 })(ElevenLabsModel || (ElevenLabsModel = {}));
 var OpenAIRealtimeModel;
 (function(OpenAIRealtimeModel2) {
+  OpenAIRealtimeModel2["GPT_REALTIME_WHISPER"] = "gpt-realtime-whisper";
   OpenAIRealtimeModel2["GPT_4O_TRANSCRIBE"] = "gpt-4o-transcribe";
   OpenAIRealtimeModel2["GPT_4O_MINI_TRANSCRIBE"] = "gpt-4o-mini-transcribe";
 })(OpenAIRealtimeModel || (OpenAIRealtimeModel = {}));
@@ -3829,6 +3831,11 @@ var AwsTranscribeModel;
 (function(AwsTranscribeModel2) {
   AwsTranscribeModel2["DEFAULT"] = "default";
 })(AwsTranscribeModel || (AwsTranscribeModel = {}));
+var AmazonNovaSonicModel;
+(function(AmazonNovaSonicModel2) {
+  AmazonNovaSonicModel2["AMAZON_NOVA_SONIC_V1"] = "amazon.nova-sonic-v1:0";
+  AmazonNovaSonicModel2["AMAZON_NOVA_2_SONIC"] = "amazon.nova-2-sonic-v1:0";
+})(AmazonNovaSonicModel || (AmazonNovaSonicModel = {}));
 var SelfServeVllmModel;
 (function(SelfServeVllmModel2) {
   SelfServeVllmModel2["QWEN3_ASR_1_7B"] = "qwen3-asr-1.7b";
@@ -3845,6 +3852,18 @@ var RecognitionResultTypeV1;
   RecognitionResultTypeV12["AUDIO_METRICS"] = "AudioMetrics";
   RecognitionResultTypeV12["SESSION_CONFIGURED"] = "SessionConfigured";
 })(RecognitionResultTypeV1 || (RecognitionResultTypeV1 = {}));
+var DetectionTypeV1;
+(function(DetectionTypeV12) {
+  DetectionTypeV12["SEARCH"] = "search";
+})(DetectionTypeV1 || (DetectionTypeV1 = {}));
+var DetectionV1Schema = z.object({
+  type: z.nativeEnum(DetectionTypeV1),
+  query: z.string(),
+  score: z.number().min(0).max(1),
+  startMs: z.number().optional(),
+  endMs: z.number().optional()
+  // Audio time (ms from stream start) where the hit ends
+});
 var TranscriptionResultSchemaV1 = z.object({
   type: z.literal(RecognitionResultTypeV1.TRANSCRIPTION),
   audioUtteranceId: z.string(),
@@ -3863,8 +3882,9 @@ var TranscriptionResultSchemaV1 = z.object({
   endTimestamp: z.number().optional(),
   receivedAtMs: z.number().optional(),
   accumulatedAudioTimeMs: z.number().optional(),
-  rawAudioTimeMs: z.number().optional()
-  // Total audio duration sent to provider (includes prefix)
+  rawAudioTimeMs: z.number().optional(),
+  detections: z.array(DetectionV1Schema).optional()
+  // Provider-reported phrase detections (query + score, optionally startMs/endMs). Always populated when the provider returns hits, regardless of `appendSearch`. Other providers leave this undefined.
 });
 var FunctionCallResultSchemaV1 = z.object({
   type: z.literal(RecognitionResultTypeV1.FUNCTION_CALL),
@@ -4117,7 +4137,15 @@ var TranscriptMessageSchema = z.object({
    * @example true
    * @default false
    */
-  is_fallback: z.boolean().optional()
+  is_fallback: z.boolean().optional(),
+  /**
+   * Provider-reported phrase detections (query + score, optionally
+   * startMs/endMs). Always populated when the provider returns hits,
+   * regardless of `appendSearch` or scene gating. Other providers leave
+   * this undefined.
+   * @example [{ query: 'justin bieber one time', score: 0.78, startMs: 1200, endMs: 2800 }]
+   */
+  detections: z.array(DetectionV1Schema).optional()
 });
 var VADEndSignalSchema = z.object({
   type: z.literal(ProviderMessageType.VAD_END_SIGNAL),
@@ -4434,6 +4462,9 @@ var ASRRequestSchemaV1 = z.object({
   // Streaming audio metrics opt-in: when > 0, server emits AudioMetrics results throttled to this interval (ms).
   // Undefined / 0 disables streaming audio metrics (final metrics still embedded in Metadata).
   audioMetricsIntervalMs: z.number().optional(),
+  // Opt-in: round-trip Deepgram `search` phrase hits into the transcript.
+  // Active only when (model = deepgram nova-2) AND (GameContext.gamePhase = 'Solve Puzzle'). See ASRRequestConfig.appendSearch in asr-config.types.ts for full semantics.
+  appendSearch: z.boolean().optional(),
   // Debug options (FOR DEBUG/TESTING ONLY - not for production use)
   debugCommand: RequestDebugCommandSchema
 });
@@ -5759,6 +5790,12 @@ var RealTimeTwoWayWebSocketRecognitionClient = class _RealTimeTwoWayWebSocketRec
         // Streaming audio metrics opt-in (ms interval). Server only forwards metrics if > 0.
         ...this.config.asrRequestConfig.audioMetricsIntervalMs !== void 0 && {
           audioMetricsIntervalMs: this.config.asrRequestConfig.audioMetricsIntervalMs
+        },
+        // Opt-in: round-trip Deepgram nova-2 search-phrase hits into the
+        // transcript. Only fires server-side when (model = nova-2) AND
+        // (GameContext.gamePhase = 'Solve Puzzle'). See ASRRequestConfig.appendSearch.
+        ...this.config.asrRequestConfig.appendSearch !== void 0 && {
+          appendSearch: this.config.asrRequestConfig.appendSearch
         }
       };
       super.sendMessage(