npm - @trustchex/react-native-sdk - Versions diffs - 1.362.4 → 1.374.0 - Mend

@trustchex/react-native-sdk 1.362.4 → 1.374.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

package/TrustchexSDK.podspec CHANGED Viewed

@@ -19,9 +19,9 @@ Pod::Spec.new do |s|
   s.public_header_files = "ios/OpenCV/OpenCVHelper.h"
   # ML Kit dependencies
-  s.dependency "GoogleMLKit/TextRecognition"
-  s.dependency "GoogleMLKit/FaceDetection"
-  s.dependency "GoogleMLKit/BarcodeScanning"
+  s.dependency "GoogleMLKit/TextRecognition", "~> 9.0"
+  s.dependency "GoogleMLKit/FaceDetection", "~> 9.0"
+  s.dependency "GoogleMLKit/BarcodeScanning", "~> 9.0"
   # OpenCV dependency
   s.dependency "OpenCV", "~> 4.3.0"

package/android/build.gradle CHANGED Viewed

@@ -83,9 +83,9 @@ dependencies {
   implementation "androidx.camera:camera-video:1.4.0"
   // Google ML Kit dependencies
-  implementation 'com.google.mlkit:text-recognition:16.0.1'
-  implementation 'com.google.mlkit:face-detection:16.1.7'
-  implementation 'com.google.mlkit:barcode-scanning:17.3.0'
+  implementation 'com.google.mlkit:text-recognition:16.0.0'
+  implementation 'com.google.mlkit:face-detection:16.1.5'
+  implementation 'com.google.mlkit:barcode-scanning:17.1.0'
   // Google Play Services dependency for Tasks
   implementation 'com.google.android.gms:play-services-tasks:18.2.0'

package/android/src/main/java/com/trustchex/reactnativesdk/camera/TrustchexCameraView.kt CHANGED Viewed

@@ -44,10 +44,10 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
     // ==================================================================================
     // PORTRAIT-ONLY CAMERA VIEW
     // All camera use cases are locked to ROTATION_0 (portrait) orientation.
-    // Preview: 720x1280 (Portrait HD)
-    // ImageAnalysis: 720x1280 (Portrait HD for ML Kit)
-    // ImageCapture: 720x1280 (Portrait HD for frame capture during recording)
-    // VideoCapture: Quality.HD (CameraX auto-selects portrait HD resolution)
+    // Supports two resolutions:
+    //   - HD: 720x1280 (portrait HD) - lower bandwidth, faster processing
+    //   - Full HD: 1080x1920 (portrait Full HD, default) - sharp text/document capture
+    // Selection criteria: use Full HD for document scanning, HD for real-time detection
     // Activity must be locked to portrait in AndroidManifest.xml
     // ==================================================================================
@@ -69,6 +69,7 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
     private var torchEnabled = false
     private var frameProcessingEnabled = false
     private var targetFps = 10
+    private var resolution = "fullhd" // "hd" (720x1280) or "fullhd" (1080x1920, default)
     private var isCameraInitialized = false
     private var isStoppingRecording = false // Track if stopRecording was called to prevent cancelRecording from deleting the file
@@ -80,6 +81,8 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
     // ML Kit detector instances (lazy, created once)
     private val textRecognizer by lazy {
+        // Use DEFAULT_OPTIONS for best accuracy with Latin scripts (including MRZ)
+        // ML Kit Text Recognition v2 provides superior accuracy for document scanning
         TextRecognition.getClient(TextRecognizerOptions.DEFAULT_OPTIONS)
     }
     private val faceDetector by lazy {
@@ -202,6 +205,14 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
         targetFps = fps.coerceIn(1, 30)
     }
+    fun setResolution(res: String) {
+        // Accept "hd" or "fullhd" (default "fullhd" for 1080x1920)
+        resolution = if (res.lowercase() == "hd") "hd" else "fullhd"
+        if (isCameraInitialized) {
+            initializeCamera()
+        }
+    }
     fun setFaceDetectionEnabled(enabled: Boolean) {
         faceDetectionEnabled = enabled
     }
@@ -238,14 +249,12 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
         provider.unbindAll()
         try {
-            // Determine resolution based on camera type
-            // Front camera (liveness): HD (720x1280) for optimal performance
-            // Back camera (documents): Full HD (1080x1920) for sharp document capture
-            val isFrontCamera = cameraSelector == CameraSelector.DEFAULT_FRONT_CAMERA
-            val targetResolution = if (isFrontCamera) {
-                Size(720, 1280) // Portrait HD for front camera
-            } else {
-                Size(1080, 1920) // Portrait Full HD for back camera
+            // Determine resolution based on configured resolution setting
+            // "hd": 720x1280 (lower bandwidth, faster processing)
+            // "fullhd": 1080x1920 (default - sharp text/document capture)
+            val targetResolution = when (resolution.lowercase()) {
+                "hd" -> Size(720, 1280)     // Portrait HD
+                else -> Size(1080, 1920)    // Portrait Full HD (default)
             }
             // Preview use case
@@ -273,9 +282,13 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
             // Removing it allows us to bind VideoCapture + Analyzer + Preview simultaneously
             // within the 3-use-case limit of many Android devices.
-            // Video capture use case — PORTRAIT HD
+            // Video capture use case — select quality based on resolution setting
+            val videoQuality = when (resolution.lowercase()) {
+                "hd" -> Quality.HD       // 720x1280
+                else -> Quality.FHD      // 1080x1920 (Full HD, default)
+            }
             val recorder = Recorder.Builder()
-                .setQualitySelector(QualitySelector.from(Quality.HD))
+                .setQualitySelector(QualitySelector.from(videoQuality))
                 .build()
             videoCapture = VideoCapture.withOutput(recorder)
@@ -351,6 +364,12 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
                 return
             }
+            // ML Kit Performance Optimization Tips Applied:
+            // 1. Throttle detector calls using STRATEGY_KEEP_ONLY_LATEST backpressure
+            // 2. Drop frames if detector is still busy (prevents queue buildup)
+            // 3. Process at the configured resolution ("hd" = 720x1280 portrait is the faster choice for real-time detection; default is "fullhd")
+            // 4. Use ImageAnalysis.STRATEGY_KEEP_ONLY_LATEST for frame dropping
+            // 5. Close ImageProxy immediately after ML Kit processing completes
             val hasAnyDetection = frameProcessingEnabled && (faceDetectionEnabled || textRecognitionEnabled || barcodeScanningEnabled)
             if (!hasAnyDetection) {
                 isProcessing.set(false)
@@ -363,9 +382,6 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
             // Create InputImage directly from camera frame — zero-copy, no base64 for ML Kit
             val inputImage = InputImage.fromMediaImage(mediaImage, rotationDegrees)
-            // Use original image for text recognition
-            val textInputImage = inputImage
             // Calculate portrait-oriented dimensions early (JPEG is already rotated)
             val isRotated = rotationDegrees == 90 || rotationDegrees == 270
@@ -376,6 +392,10 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
             // Brightness calculation restricted to scanning frame area (between 36% from top and 36% from bottom, 5% margins on sides)
             val averageBrightness = computeYPlaneBrightness(imageProxy, reportedWidth, reportedHeight)
+            // Use original inputImage directly for text recognition
+            // ML Kit works best with native camera frames, not processed bitmaps
+            val textInputImage = inputImage
             // Generate JPEG base64 only when JS side explicitly needs the image
             // NOTE: Do NOT auto-generate for face detection - too expensive, causes frame drops
             val jpegBase64: String? = if (includeBase64) {
@@ -390,6 +410,9 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
             } else null
             val textTask = if (textRecognitionEnabled) {
+                if (!frameProcessingEnabled) {
+                    android.util.Log.w("TrustchexCamera", "Text recognition enabled but frame processing disabled!")
+                }
                 textRecognizer.process(textInputImage).also { tasks.add(it) }
             } else null
@@ -398,6 +421,7 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
             } else null
             // Wait for all detectors, then build + send a single event to JS
+            // ML Kit resource cleanup: InputImage needs no explicit release, but the backing ImageProxy must still be closed once the tasks complete
             Tasks.whenAllComplete(tasks).addOnCompleteListener { _ ->
                 try {
                     val frameData = Arguments.createMap()
@@ -451,6 +475,9 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
                         if (textTask.isSuccessful) {
                             val result = textTask.result
                             frameData.putString("resultText", result.text)
+                            if (result.text.isNotEmpty()) {
+                                android.util.Log.d("TrustchexCamera", "✓ Text recognized: length=${result.text.length}")
+                            }
                             val blocksArray = Arguments.createArray()
                             for (block in result.textBlocks) {
@@ -471,6 +498,7 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
                             }
                             frameData.putArray("textBlocks", blocksArray)
                         } else {
+                            android.util.Log.d("TrustchexCamera", "⚠ Text recognition failed")
                             frameData.putString("resultText", "")
                             frameData.putArray("textBlocks", Arguments.createArray())
                         }
@@ -581,6 +609,32 @@ class TrustchexCameraView(context: ThemedReactContext) : FrameLayout(context) {
         return if (count > 0) sum.toDouble() / count else 0.0
     }
+    /**
+     * Scores how suitable the image dimensions are for ML Kit text recognition.
+     *
+     * ML Kit text recognition requirements:
+     * - Minimum 16x16 pixels per character for acceptable accuracy
+     * - Ideal: 16-24 pixels per character for optimal performance
+     * - At 720x1280 (portrait HD), assuming ~30px average character width:
+     *   - Can fit ~24 characters per line (720/30)
+     *   - Can fit ~42 lines (1280/30)
+     *
+     * @return quality score (0.0-1.0) where 1.0 is optimal
+     */
+    private fun calculateTextRecognitionQuality(width: Int, height: Int): Double {
+        // For text at typical font sizes, we want at least 720px width
+        // Quality decreases significantly below 640px
+        val pixelScore = when {
+            width >= 720 && height >= 1280 -> 1.0  // Optimal
+            width >= 640 && height >= 960 -> 0.85   // Good
+            width >= 480 && height >= 640 -> 0.65   // Acceptable
+            else -> 0.4                              // Poor
+        }
+        return pixelScore
+    }
     private fun yuvImageProxyToJpegBase64(imageProxy: ImageProxy, rotationDegrees: Int): String? {
         try {
             val width = imageProxy.width

package/ios/Camera/TrustchexCameraView.swift CHANGED Viewed

@@ -30,6 +30,14 @@ class TrustchexCameraView: UIView {
             }
         }
     }
+    @objc var resolution: String = "fullhd" {
+        didSet {
+            if resolution != oldValue {
+                // "hd" or "fullhd" - reinitialize camera with new resolution
+                setupCamera()
+            }
+        }
+    }
     @objc var torchEnabled: Bool = false {
         didSet {
             if torchEnabled != oldValue {
@@ -114,27 +122,23 @@ class TrustchexCameraView: UIView {
         // Add video input
         let cameraPosition: AVCaptureDevice.Position = (_cameraType == "front") ? .front : .back
-        // Set quality based on camera type
-        // Front camera (liveness): Full HD (1920x1080) for high-quality face detection
-        // Back camera (documents): Full HD (1920x1080) for sharp document capture
-        if cameraPosition == .front {
-            // Front camera: Use Full HD for high-quality liveness detection
-            if session.canSetSessionPreset(.hd1920x1080) {
-                session.sessionPreset = .hd1920x1080
-            } else if session.canSetSessionPreset(.hd1280x720) {
-                session.sessionPreset = .hd1280x720
-            } else {
-                session.sessionPreset = .high
-            }
+        // Set quality based on resolution setting
+        // "hd": 1280x720 (HD) - lower bandwidth, faster processing
+        // "fullhd": 1920x1080 (Full HD, default) - sharp text/document capture
+        let sessionPreset: AVCaptureSession.Preset
+        if resolution.lowercased() == "hd" {
+            sessionPreset = .hd1280x720
         } else {
-            // Back camera: Use Full HD for document scanning
-            if session.canSetSessionPreset(.hd1920x1080) {
-                session.sessionPreset = .hd1920x1080
-            } else if session.canSetSessionPreset(.hd1280x720) {
-                session.sessionPreset = .hd1280x720
-            } else {
-                session.sessionPreset = .high
-            }
+            sessionPreset = .hd1920x1080  // Full HD (default)
+        }
+        if session.canSetSessionPreset(sessionPreset) {
+            session.sessionPreset = sessionPreset
+        } else if sessionPreset == .hd1920x1080 && session.canSetSessionPreset(.hd1280x720) {
+            // Fallback from Full HD to HD
+            session.sessionPreset = .hd1280x720
+        } else if session.canSetSessionPreset(.high) {
+            session.sessionPreset = .high
         }
         let camera = selectBestCamera(for: cameraPosition)
         guard let camera = camera,
@@ -418,6 +422,12 @@ class TrustchexCameraView: UIView {
         targetFps = fps
     }
+    @objc(setResolution:)
+    func setResolution(_ res: String) {
+        // "hd" (1280x720) or "fullhd" (1920x1080, default)
+        resolution = res.lowercased() == "hd" ? "hd" : "fullhd"
+    }
     @objc func setFocusPoint(_ x: NSNumber, _ y: NSNumber) {
         sessionQueue.async { [weak self] in
             guard let camera = self?.currentCamera else { return }
@@ -695,6 +705,12 @@ extension TrustchexCameraView: AVCaptureVideoDataOutputSampleBufferDelegate {
             }
             lastFrameTime = currentTime
+            // ML Kit Performance Optimization Tips Applied (iOS):
+            // 1. alwaysDiscardsLateVideoFrames = true throttles detector calls
+            // 2. Drop frames if detector is still busy (prevents queue buildup)
+            // 3. Process at 1080x1920 (Full HD) for optimal real-time detection
+            // 4. Use synchronous results(in:) API for video frames (Google recommended)
+            // 5. Dispatch to background queue to unblock videoQueue immediately
             // Mark as processing on videoQueue
             isProcessing = true
@@ -733,16 +749,30 @@ extension TrustchexCameraView: AVCaptureVideoDataOutputSampleBufferDelegate {
         let ciImage = CIImage(cvPixelBuffer: pixelBuffer)
         let orientedImage = isBufferLandscape ? ciImage.oriented(.right) : ciImage
-        // Create VisionImage from the oriented CIImage for better text recognition
+        // Compute brightness once, up front, so it does not have to be recomputed after detection
+        let brightness = computeBrightness(from: pixelBuffer, width: portraitWidth, height: portraitHeight)
+        // For text recognition, use the original oriented image directly (no enhancement is applied)
+        // ML Kit works best with native camera frames
+        let textEnhancedImage = orientedImage
+        // Create VisionImage from that image for better text recognition
         // This ensures MLKit processes the image in the correct orientation
-        guard let cgImage = self.ciContext.createCGImage(orientedImage, from: orientedImage.extent) else {
+        guard let cgImage = self.ciContext.createCGImage(textEnhancedImage, from: textEnhancedImage.extent) else {
             resetProcessingState()
             return
         }
         let visionImage = VisionImage(image: UIImage(cgImage: cgImage))
         visionImage.orientation = .up  // Already oriented correctly
-        // Use original image for text recognition
+        // Use image for text recognition
+        // ML Kit text recognition best practices (iOS):
+        // - Requires minimum 16x16 pixels per character (ideal 16-24px per character)
+        // - Input image: 1080x1920 (portrait Full HD) provides excellent accuracy at real-time speed
+        // - Each character at ~30px = 36 characters per line @ 1080px width
+        // - Use synchronous results(in:) API from captureOutput(_:didOutput:from:)
+        // - Set AVCaptureVideoDataOutput.alwaysDiscardsLateVideoFrames = true (throttle)
+        // - Get results then render overlay in single step for optimal performance
         let textVisionImage = visionImage
         // Generate JPEG base64 only when JS side explicitly needs the image
@@ -755,125 +785,114 @@ extension TrustchexCameraView: AVCaptureVideoDataOutputSampleBufferDelegate {
             }
         }
-        // Synchronous processing using a semaphore to keep the buffer locked
-        // This blocks processingQueue, which is fine (we are off videoQueue)
-        let semaphore = DispatchSemaphore(value: 0)
+        // ML Kit Performance Best Practice (iOS):
+        // Use synchronous results(in:) API for video processing instead of async process()
+        // This is Google's recommended approach for real-time video frame processing
+        // Source: https://developers.google.com/ml-kit/vision/barcode-scanning/ios#performance-tips
         var facesArray: [[String: Any]] = []
         var textBlocksArray: [[String: Any]] = []
         var barcodesArray: [[String: Any]] = []
+        // Face detection using synchronous API
         if enableFaceDetection {
-            faceDetector.process(visionImage) { faces, error in
-                if let faces = faces {
-                    for face in faces {
-                        var faceMap: [String: Any] = [:]
-                        let isFront = self._cameraType == "front"
-                        let faceX = isFront ? CGFloat(portraitWidth) - face.frame.origin.x - face.frame.width : face.frame.origin.x
-                        faceMap["bounds"] = [
-                            "x": Int(faceX),
-                            "y": Int(face.frame.origin.y),
-                            "width": Int(face.frame.width),
-                            "height": Int(face.frame.height)
-                        ]
-                        faceMap["yawAngle"] = face.hasHeadEulerAngleY ? Double(face.headEulerAngleY) : 0.0
-                        faceMap["pitchAngle"] = face.hasHeadEulerAngleX ? Double(face.headEulerAngleX) : 0.0
-                        faceMap["rollAngle"] = face.hasHeadEulerAngleZ ? Double(face.headEulerAngleZ) : 0.0
-                        if face.hasTrackingID {
-                            faceMap["trackingId"] = face.trackingID
-                        }
-                        // Only include probability fields when available (matching Android behavior)
-                        if face.hasSmilingProbability {
-                            faceMap["smilingProbability"] = Double(face.smilingProbability)
-                        }
-                        if face.hasLeftEyeOpenProbability {
-                            faceMap["leftEyeOpenProbability"] = Double(face.leftEyeOpenProbability)
-                        }
-                        if face.hasRightEyeOpenProbability {
-                            faceMap["rightEyeOpenProbability"] = Double(face.rightEyeOpenProbability)
-                        }
-                        facesArray.append(faceMap)
+            do {
+                let faces = try faceDetector.results(in: visionImage)
+                for face in faces {
+                    var faceMap: [String: Any] = [:]
+                    let isFront = self._cameraType == "front"
+                    let faceX = isFront ? CGFloat(portraitWidth) - face.frame.origin.x - face.frame.width : face.frame.origin.x
+                    faceMap["bounds"] = [
+                        "x": Int(faceX),
+                        "y": Int(face.frame.origin.y),
+                        "width": Int(face.frame.width),
+                        "height": Int(face.frame.height)
+                    ]
+                    faceMap["yawAngle"] = face.hasHeadEulerAngleY ? Double(face.headEulerAngleY) : 0.0
+                    faceMap["pitchAngle"] = face.hasHeadEulerAngleX ? Double(face.headEulerAngleX) : 0.0
+                    faceMap["rollAngle"] = face.hasHeadEulerAngleZ ? Double(face.headEulerAngleZ) : 0.0
+                    if face.hasTrackingID {
+                        faceMap["trackingId"] = face.trackingID
+                    }
+                    // Only include probability fields when available (matching Android behavior)
+                    if face.hasSmilingProbability {
+                        faceMap["smilingProbability"] = Double(face.smilingProbability)
+                    }
+                    if face.hasLeftEyeOpenProbability {
+                        faceMap["leftEyeOpenProbability"] = Double(face.leftEyeOpenProbability)
                     }
+                    if face.hasRightEyeOpenProbability {
+                        faceMap["rightEyeOpenProbability"] = Double(face.rightEyeOpenProbability)
+                    }
+                    facesArray.append(faceMap)
                 }
-                semaphore.signal()
+            } catch {
+                // Face detection failed - continue with empty array
             }
-        } else {
-            semaphore.signal()
         }
-        // Text recognition
-        let textSemaphore = DispatchSemaphore(value: 0)
+        // Text recognition using synchronous API
+        // On iOS, this completes quickly at 1080x1920 resolution (~100-300ms per frame)
         var resultText = ""
         if enableTextRecognition {
-            textRecognizer.process(textVisionImage) { text, error in
-                if let text = text {
-                    resultText = text.text
-                    for block in text.blocks {
-                        var blockMap: [String: Any] = ["text": block.text]
-                        let bb = block.frame
-                        // When buffer is landscape (1920x1080) but we set orientation to .right,
-                        // ML Kit might still return coordinates in landscape space.
-                        // We need to rotate them to portrait space (1080x1920) to match face detection.
-                        let blockX: Int
-                        let blockY: Int
-                        let blockWidth: Int
-                        let blockHeight: Int
-                        if isBufferLandscape {
-                            // Rotate from landscape (1920x1080) to portrait (1080x1920)
-                            // When rotating 90° clockwise (.right):
-                            // new_x = old_y
-                            // new_y = landscape_width - old_x - width
-                            // new_width = old_height
-                            // new_height = old_width
-                            blockX = Int(bb.origin.y)
-                            blockY = pixelWidth - Int(bb.origin.x) - Int(bb.width)
-                            blockWidth = Int(bb.height)
-                            blockHeight = Int(bb.width)
-                        } else {
-                            // Already portrait, use directly
-                            blockX = Int(bb.origin.x)
-                            blockY = Int(bb.origin.y)
-                            blockWidth = Int(bb.width)
-                            blockHeight = Int(bb.height)
-                        }
-                        blockMap["blockFrame"] = [
-                            "x": blockX,
-                            "y": blockY,
-                            "width": blockWidth,
-                            "height": blockHeight,
-                            "boundingCenterX": blockX + blockWidth / 2,
-                            "boundingCenterY": blockY + blockHeight / 2
-                        ]
-                        textBlocksArray.append(blockMap)
+            do {
+                let text = try textRecognizer.results(in: textVisionImage)
+                resultText = text.text
+                for block in text.blocks {
+                    var blockMap: [String: Any] = ["text": block.text]
+                    let bb = block.frame
+                    // When buffer is landscape (1920x1080) but we set orientation to .right,
+                    // ML Kit might still return coordinates in landscape space.
+                    // We need to rotate them to portrait space (1080x1920) to match face detection.
+                    let blockX: Int
+                    let blockY: Int
+                    let blockWidth: Int
+                    let blockHeight: Int
+                    if isBufferLandscape {
+                        // Rotate from landscape (1920x1080) to portrait (1080x1920)
+                        // When rotating 90° clockwise (.right):
+                        // new_x = old_y
+                        // new_y = landscape_width - old_x - width
+                        // new_width = old_height
+                        // new_height = old_width
+                        blockX = Int(bb.origin.y)
+                        blockY = pixelWidth - Int(bb.origin.x) - Int(bb.width)
+                        blockWidth = Int(bb.height)
+                        blockHeight = Int(bb.width)
+                    } else {
+                        // Already portrait, use directly
+                        blockX = Int(bb.origin.x)
+                        blockY = Int(bb.origin.y)
+                        blockWidth = Int(bb.width)
+                        blockHeight = Int(bb.height)
                     }
+                    blockMap["blockFrame"] = [
+                        "x": blockX,
+                        "y": blockY,
+                        "width": blockWidth,
+                        "height": blockHeight,
+                        "boundingCenterX": blockX + blockWidth / 2,
+                        "boundingCenterY": blockY + blockHeight / 2
+                    ]
+                    textBlocksArray.append(blockMap)
                 }
-                textSemaphore.signal()
+            } catch {
+                // Text recognition failed - continue with empty result
             }
-        } else {
-            textSemaphore.signal()
         }
         // Barcode scanning - use native AVFoundation results (captured via metadata delegate)
         // This is much faster than MLKit barcode scanning
-        let barcodeSemaphore = DispatchSemaphore(value: 0)
         if enableBarcodeScanning {
             // Use the barcodes detected by the native AVCaptureMetadataOutput
             barcodesArray = lastDetectedBarcodes
-            barcodeSemaphore.signal()
-        } else {
-            barcodeSemaphore.signal()
         }
-        // Wait for vision tasks (with timeout to prevent hang)
-        _ = semaphore.wait(timeout: .now() + 2.0)
-        _ = textSemaphore.wait(timeout: .now() + 2.0)
-        // Only compute brightness if we haven't timed out or crashed
-        // Brightness calculation restricted to scanning frame area (between 36% from top and 36% from bottom, 5% margins on sides)
-        let brightness = computeBrightness(from: pixelBuffer, width: portraitWidth, height: portraitHeight)
+        // Brightness was already computed earlier in this method, before detection ran
+        // No need to recompute here
         let currentTime = CACurrentMediaTime() * 1000 // Convert to milliseconds to match Android
@@ -962,6 +981,35 @@ extension TrustchexCameraView: AVCaptureVideoDataOutputSampleBufferDelegate {
         return Double(sum) / Double(sampleCount)
     }
+    /**
+     * Scores how suitable the image dimensions are for ML Kit text recognition (iOS).
+     *
+     * ML Kit text recognition requirements (iOS):
+     * - Minimum 16x16 pixels per character for acceptable accuracy
+     * - Ideal: 16-24 pixels per character for optimal performance
+     * - At 1080x1920 (portrait Full HD), assuming ~30px average character width:
+     *   - Can fit ~36 characters per line (1080/30)
+     *   - Can fit ~64 lines (1920/30)
+     * - Performance: ~100-300ms per frame at 1080x1920 with the synchronous results(in:) API
+     *
+     * @return quality score (0.0-1.0) where 1.0 is optimal
+     */
+    private func calculateTextRecognitionQuality(width: Int, height: Int) -> Double {
+        // iOS uses 1080x1920 as standard, so we prefer that
+        let pixelScore: Double
+        switch (width, height) {
+        case (1080..., 1920...):
+            pixelScore = 1.0  // Optimal (Full HD)
+        case (720..., 1280...):
+            pixelScore = 0.85   // Good (HD)
+        case (640..., 960...):
+            pixelScore = 0.65    // Acceptable
+        default:
+            pixelScore = 0.4     // Poor
+        }
+        return pixelScore
+    }
 }
 // MARK: - AVCaptureFileOutputRecordingDelegate
@@ -1131,7 +1179,6 @@ extension TrustchexCameraView: AVCaptureMetadataOutputObjectsDelegate {
         lastDetectedBarcodes = barcodes
     }
 }
 // MARK: - Helper Extensions
 extension Comparable {
     func clamped(to limits: ClosedRange<Self>) -> Self {

package/lib/module/Shared/Components/FaceCamera.js CHANGED Viewed

@@ -264,6 +264,7 @@ const FaceCamera = ({
       includeBase64: true // Enabled to capture photos for liveness steps
       ,
       targetFps: 5,
+      resolution: "hd",
       onFrameAvailable: handleFrame,
       onCameraReady: handleCameraReady,
       onCameraError: handleCameraError