npm - @qafka/react-native - Versions diffs - 2.3.2 → 2.3.4 - Mend

@qafka/react-native 2.3.2 → 2.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/android/src/main/AndroidManifest.xml +2 -0
package/android/src/main/java/com/qafka/audio/QafkaAudioModule.kt +48 -0
package/dist/native/QafkaAudio.d.ts +7 -0
package/dist/native/QafkaAudio.js +20 -0
package/dist/native/ensure-record-permission.d.ts +20 -0
package/dist/native/ensure-record-permission.js +11 -0
package/dist/services/RealtimeService.js +11 -0
package/package.json +1 -1

package/android/src/main/AndroidManifest.xml CHANGED Viewed

@@ -1,2 +1,4 @@
 <manifest xmlns:android="http://schemas.android.com/apk/res/android">
+    <!-- Required for voice capture. Merged into the consumer app manifest. -->
+    <uses-permission android:name="android.permission.RECORD_AUDIO" />
 </manifest>

package/android/src/main/java/com/qafka/audio/QafkaAudioModule.kt CHANGED Viewed

@@ -1,8 +1,11 @@
 package com.qafka.audio
 import android.Manifest
+import android.content.Context
 import android.content.pm.PackageManager
+import android.media.AudioAttributes
 import android.media.AudioFormat
+import android.media.AudioManager
 import android.media.AudioRecord
 import android.media.AudioTrack
 import android.media.MediaRecorder
@@ -33,6 +36,11 @@ class QafkaAudioModule(reactContext: ReactApplicationContext) :
     private var noiseSuppressor: NoiseSuppressor? = null
     private var automaticGainControl: AutomaticGainControl? = null
+    // Audio-mode state saved on startCapture and restored on stopCapture so the
+    // host app's audio routing is left exactly as we found it.
+    private var previousAudioMode: Int? = null
+    private var previousSpeakerphoneOn: Boolean? = null
     companion object {
         private const val TAG = "QafkaAudio"
         private const val CAPTURE_SAMPLE_RATE = 16000
@@ -110,6 +118,24 @@ class QafkaAudioModule(reactContext: ReactApplicationContext) :
         val bufferSize = maxOf(minBufferSize, 4096)
+        // iOS VPIO equivalent (part 1): put the audio system into communication
+        // mode and route both capture and playback through the voice path.
+        // Without this the AudioTrack below plays on the media path, which the
+        // VOICE_COMMUNICATION capture's echo canceler has no reference to — so
+        // the AI's own playback leaks back into the mic and it talks to itself.
+        try {
+            val audioManager =
+                reactApplicationContext.getSystemService(Context.AUDIO_SERVICE) as AudioManager
+            previousAudioMode = audioManager.mode
+            previousSpeakerphoneOn = audioManager.isSpeakerphoneOn
+            audioManager.mode = AudioManager.MODE_IN_COMMUNICATION
+            @Suppress("DEPRECATION")
+            audioManager.isSpeakerphoneOn = true
+            dlogI("✅ AudioManager mode=IN_COMMUNICATION, speakerphone=on")
+        } catch (e: Exception) {
+            dlogW("⚠️ Failed to set communication audio mode: ${e.message}")
+        }
         try {
             val record = AudioRecord(
                 MediaRecorder.AudioSource.VOICE_COMMUNICATION,
@@ -164,7 +190,16 @@ class QafkaAudioModule(reactContext: ReactApplicationContext) :
             )
             val playBufferSize = maxOf(playMinBuffer, 4096)
+            // iOS VPIO equivalent (part 2): play on the voice-communication path
+            // (USAGE_VOICE_COMMUNICATION + CONTENT_TYPE_SPEECH) so the echo
+            // canceler bound to the capture session can reference and cancel it.
             val track = AudioTrack.Builder()
+                .setAudioAttributes(
+                    AudioAttributes.Builder()
+                        .setUsage(AudioAttributes.USAGE_VOICE_COMMUNICATION)
+                        .setContentType(AudioAttributes.CONTENT_TYPE_SPEECH)
+                        .build()
+                )
                 .setAudioFormat(
                     AudioFormat.Builder()
                         .setSampleRate(PLAYBACK_SAMPLE_RATE)
@@ -247,6 +282,19 @@ class QafkaAudioModule(reactContext: ReactApplicationContext) :
         } catch (_: Exception) {}
         audioTrack = null
+        // Restore the host app's audio mode / routing exactly as we found it.
+        try {
+            val audioManager =
+                reactApplicationContext.getSystemService(Context.AUDIO_SERVICE) as AudioManager
+            previousAudioMode?.let { audioManager.mode = it }
+            previousSpeakerphoneOn?.let {
+                @Suppress("DEPRECATION")
+                audioManager.isSpeakerphoneOn = it
+            }
+        } catch (_: Exception) {}
+        previousAudioMode = null
+        previousSpeakerphoneOn = null
         promise.resolve(true)
     }

package/dist/native/QafkaAudio.d.ts CHANGED Viewed

@@ -1,4 +1,11 @@
 export declare const QafkaAudio: {
+    /**
+     * Ensure microphone access before capturing. iOS prompts natively inside
+     * startCapture; on Android the RECORD_AUDIO runtime permission is requested
+     * here (the platform never auto-prompts), otherwise capture starts denied and
+     * the voice stream is silent. Resolves to whether mic access is available.
+     */
+    ensureRecordPermission: () => Promise<boolean>;
     startCapture: () => Promise<boolean>;
     stopCapture: () => Promise<boolean>;
     playAudioChunk: (base64Data: string) => Promise<boolean>;

package/dist/native/QafkaAudio.js CHANGED Viewed

@@ -2,6 +2,7 @@
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.QafkaAudio = void 0;
 const react_native_1 = require("react-native");
+const ensure_record_permission_1 = require("./ensure-record-permission");
 const { QafkaAudio: NativeQafkaAudio } = react_native_1.NativeModules;
 const emitter = NativeQafkaAudio ? new react_native_1.NativeEventEmitter(NativeQafkaAudio) : null;
 const MISSING_MODULE_MESSAGE = `QafkaAudio native module is not linked. ` +
@@ -15,6 +16,25 @@ const requireModule = () => {
     return NativeQafkaAudio;
 };
 exports.QafkaAudio = {
+    /**
+     * Ensure microphone access before capturing. iOS prompts natively inside
+     * startCapture; on Android the RECORD_AUDIO runtime permission is requested
+     * here (the platform never auto-prompts), otherwise capture starts denied and
+     * the voice stream is silent. Resolves to whether mic access is available.
+     */
+    ensureRecordPermission: () => (0, ensure_record_permission_1.ensureRecordPermission)({
+        os: react_native_1.Platform.OS,
+        check: () => react_native_1.PermissionsAndroid.check(react_native_1.PermissionsAndroid.PERMISSIONS.RECORD_AUDIO),
+        request: async () => {
+            const result = await react_native_1.PermissionsAndroid.request(react_native_1.PermissionsAndroid.PERMISSIONS.RECORD_AUDIO, {
+                title: 'Microphone permission',
+                message: 'Microphone access is required for voice conversations.',
+                buttonPositive: 'OK',
+                buttonNegative: 'Cancel',
+            });
+            return result === react_native_1.PermissionsAndroid.RESULTS.GRANTED;
+        },
+    }),
     startCapture: () => requireModule().startCapture(),
     stopCapture: () => requireModule().stopCapture(),
     playAudioChunk: (base64Data) => requireModule().playAudioChunk(base64Data),

package/dist/native/ensure-record-permission.d.ts ADDED Viewed

@@ -0,0 +1,20 @@
+/**
+ * Resolve microphone permission before voice capture starts.
+ *
+ * iOS requests the permission as part of starting native capture, so this is a
+ * no-op there. On Android the platform never auto-prompts for the runtime
+ * RECORD_AUDIO permission — it must be requested explicitly, otherwise capture
+ * starts denied and the voice stream stays silent.
+ *
+ * Kept pure and dependency-injected so it can be unit-tested without the
+ * react-native runtime; {@link QafkaAudio} wires the real platform calls in.
+ */
+export interface RecordPermissionDeps {
+    /** Platform identifier (react-native `Platform.OS`); any value other than 'android' skips the permission flow. */
+    os: string;
+    /** Resolve whether RECORD_AUDIO is already granted. */
+    check: () => Promise<boolean>;
+    /** Prompt the user for RECORD_AUDIO; resolve whether it was granted. */
+    request: () => Promise<boolean>;
+}
+export declare function ensureRecordPermission(deps: RecordPermissionDeps): Promise<boolean>;

package/dist/native/ensure-record-permission.js ADDED Viewed

@@ -0,0 +1,11 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.ensureRecordPermission = ensureRecordPermission;
+async function ensureRecordPermission(deps) {
+    // Only Android needs an explicit request; every other OS value (iOS included) resolves true here.
+    if (deps.os !== 'android')
+        return true;
+    if (await deps.check())
+        return true;
+    return deps.request();
+}

package/dist/services/RealtimeService.js CHANGED Viewed

@@ -129,6 +129,17 @@ class RealtimeService {
     }
     async startAudioPipeline() {
         try {
+            // Android needs the RECORD_AUDIO runtime permission requested explicitly
+            // before capture (iOS prompts natively inside startCapture). Without this
+            // capture starts denied and the voice stream is silent.
+            const micGranted = await QafkaAudio_1.QafkaAudio.ensureRecordPermission();
+            if (!micGranted) {
+                this.eventHandler?.({
+                    type: 'error',
+                    message: 'Microphone permission denied',
+                });
+                return;
+            }
             // Attach listener BEFORE startCapture so the native tap
             // doesn't drop early buffers (hasListeners/listenerCount gate).
             this.attachAudioListener();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@qafka/react-native",
-  "version": "2.3.2",
+  "version": "2.3.4",
   "description": "Drop-in AI assistant for React Native: chat, voice, and tool execution with screen-aware navigation.",
   "main": "./dist/index.js",
   "types": "./dist/index.d.ts",