npm - vision-camera-face-detection - Versions diffs - 2.1.0 → 2.2.1 - Mend

vision-camera-face-detection 2.1.0 → 2.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

package/README.md +2 -2
package/VisionCameraFaceDetection.podspec +1 -1
package/android/build.gradle +0 -1
package/android/gradle.properties +1 -1
package/android/src/main/java/com/visioncamerafacedetection/VisionCameraFaceDetectionPlugin.kt +100 -83
package/android/src/main/java/com/visioncamerafacedetection/VisionCameraFaceDetectorOrientation.kt +57 -0
package/ios/FaceHelper.swift +103 -220
package/ios/VisionCameraFaceDetectionPlugin.swift +326 -306
package/ios/VisionCameraFaceDetectorOrientation.swift +81 -0
package/lib/commonjs/Camera.js +58 -34
package/lib/commonjs/Camera.js.map +1 -1
package/lib/commonjs/FaceDetector.js.map +1 -1
package/lib/module/Camera.js +60 -34
package/lib/module/Camera.js.map +1 -1
package/lib/module/FaceDetector.js.map +1 -1
package/lib/typescript/commonjs/src/Camera.d.ts.map +1 -1
package/lib/typescript/commonjs/src/FaceDetector.d.ts +24 -6
package/lib/typescript/commonjs/src/FaceDetector.d.ts.map +1 -1
package/lib/typescript/module/src/Camera.d.ts.map +1 -1
package/lib/typescript/module/src/FaceDetector.d.ts +24 -6
package/lib/typescript/module/src/FaceDetector.d.ts.map +1 -1
package/package.json +6 -7
package/src/Camera.tsx +65 -33
package/src/FaceDetector.ts +31 -6

package/ios/VisionCameraFaceDetectionPlugin.swift CHANGED Viewed

@@ -10,330 +10,350 @@ import TensorFlowLite
 @objc(VisionCameraFaceDetectionPlugin)
 public class VisionCameraFaceDetectionPlugin: FrameProcessorPlugin {
-    // device display data
-    private let screenBounds = UIScreen.main.bounds
+  /// String spellings of the camera position.
+  /// The raw value of each case is the case name itself ("front" / "back").
+  enum CameraFacing: String {
+    case front
+    case back
+  }
+  // detection props
+  private var autoMode = false
+  private var faceDetector: FaceDetector! = nil
+  private var runLandmarks = false
+  private var runClassifications = false
+  private var runContours = false
+  private var trackingEnabled = false
+  private var windowWidth = 1.0
+  private var windowHeight = 1.0
+  private var cameraFacing:AVCaptureDevice.Position = .front
+  private var orientationManager = VisionCameraFaceDetectorOrientation()
+  private var enableTensor = false
+  /// Reads the plugin options and creates the face detector.
+  ///
+  /// Option keys read here: "windowWidth", "windowHeight", "cameraFacing",
+  /// "autoMode", "enableTensor", "performanceMode", "landmarkMode",
+  /// "classificationMode", "contourMode", "minFaceSize", "trackingEnabled".
+  ///
+  /// - Parameters:
+  ///   - proxy: Forwarded unchanged to the superclass initializer.
+  ///   - options: Untyped option dictionary; normalised through `getConfig`.
+  public override init(
+    proxy: VisionCameraProxyHolder,
+    options: [AnyHashable : Any]! = [:]
+  ) {
+    super.init(proxy: proxy, options: options)
+    let config = getConfig(withArguments: options)
-    // detection props
-    private var autoScale = false
-    private var faceDetector: FaceDetector! = nil
-    private var runLandmarks = false
-    private var runClassifications = false
-    private var runContours = false
-    private var trackingEnabled = false
-    private var enableTensor = false
+    // window size: only overrides the stored default when a different Double is supplied
+    let windowWidthParam = config?["windowWidth"] as? Double
+    if windowWidthParam != nil && windowWidthParam != windowWidth {
+      windowWidth = CGFloat(windowWidthParam!)
+    }
-    public override init(
-        proxy: VisionCameraProxyHolder,
-        options: [AnyHashable : Any]! = [:]
-    ) {
-        super.init(proxy: proxy, options: options)
-        let config = getConfig(withArguments: options)
-        // handle auto scaling
-        autoScale = config?["autoScale"] as? Bool == true
-        // handle enable/disable tensor
-        enableTensor = config?["enableTensor"] as? Bool == true
-        // initializes faceDetector on creation
-        let minFaceSize = 0.15
-        let optionsBuilder = FaceDetectorOptions()
-        optionsBuilder.performanceMode = .fast
-        optionsBuilder.landmarkMode = .none
-        optionsBuilder.contourMode = .none
-        optionsBuilder.classificationMode = .none
-        optionsBuilder.minFaceSize = minFaceSize
-        optionsBuilder.isTrackingEnabled = false
-        if config?["performanceMode"] as? String == "accurate" {
-            optionsBuilder.performanceMode = .accurate
-        }
-        if config?["landmarkMode"] as? String == "all" {
-            runLandmarks = true
-            optionsBuilder.landmarkMode = .all
-        }
-        if config?["classificationMode"] as? String == "all" {
-            runClassifications = true
-            optionsBuilder.classificationMode = .all
-        }
-        if config?["contourMode"] as? String == "all" {
-            runContours = true
-            optionsBuilder.contourMode = .all
-        }
-        let minFaceSizeParam = config?["minFaceSize"] as? Double
-        if minFaceSizeParam != nil && minFaceSizeParam != minFaceSize {
-            optionsBuilder.minFaceSize = CGFloat(minFaceSizeParam!)
-        }
-        if config?["trackingEnabled"] as? Bool == true {
-            trackingEnabled = true
-            optionsBuilder.isTrackingEnabled = true
-        }
-        faceDetector = FaceDetector.faceDetector(options: optionsBuilder)
+    let windowHeightParam = config?["windowHeight"] as? Double
+    if windowHeightParam != nil && windowHeightParam != windowHeight {
+      windowHeight = CGFloat(windowHeightParam!)
     }
-    func getConfig(
-        withArguments arguments: [AnyHashable: Any]!
-    ) -> [String:Any]! {
-        if arguments.count > 0 {
-            let config = arguments.map { dictionary in
-                Dictionary(uniqueKeysWithValues: dictionary.map { (key, value) in
-                    (key as? String ?? "", value)
-                })
-            }
-            return config
-        }
-        return nil
+    // any value other than "back" keeps the stored default (.front)
+    if config?["cameraFacing"] as? String == "back" {
+      cameraFacing = .back
     }
-    func processBoundingBox(
-        from face: Face,
-        sourceWidth: CGFloat,
-        sourceHeight: CGFloat,
-        orientation: UIImage.Orientation,
-        scaleX: CGFloat,
-        scaleY: CGFloat
-    ) -> [String:Any] {
-        let boundingBox = face.frame
-        let width = boundingBox.width * scaleX
-        let height = boundingBox.height * scaleY
-        let x = boundingBox.origin.y * scaleX
-        let y = boundingBox.origin.x * scaleY
-        return [
-            "width": width,
-            "height": height,
-            "x": (-x + sourceWidth * scaleX) - width,
-            "y": y
-        ]
+    // handle auto scaling and rotation
+    autoMode = config?["autoMode"] as? Bool == true
+    enableTensor = config?["enableTensor"] as? Bool == true
+    // initializes faceDetector on creation
+    // defaults first: fast mode, no landmarks/contours/classification, no tracking
+    let minFaceSize = 0.15
+    let optionsBuilder = FaceDetectorOptions()
+    optionsBuilder.performanceMode = .fast
+    optionsBuilder.landmarkMode = .none
+    optionsBuilder.contourMode = .none
+    optionsBuilder.classificationMode = .none
+    optionsBuilder.minFaceSize = minFaceSize
+    optionsBuilder.isTrackingEnabled = false
+    if config?["performanceMode"] as? String == "accurate" {
+      optionsBuilder.performanceMode = .accurate
     }
-    func processLandmarks(
-        from face: Face,
-        scaleX: CGFloat,
-        scaleY: CGFloat
-    ) -> [String:[String: CGFloat?]] {
-        let faceLandmarkTypes = [
-            FaceLandmarkType.leftCheek,
-            FaceLandmarkType.leftEar,
-            FaceLandmarkType.leftEye,
-            FaceLandmarkType.mouthBottom,
-            FaceLandmarkType.mouthLeft,
-            FaceLandmarkType.mouthRight,
-            FaceLandmarkType.noseBase,
-            FaceLandmarkType.rightCheek,
-            FaceLandmarkType.rightEar,
-            FaceLandmarkType.rightEye
-        ]
-        let faceLandmarksTypesStrings = [
-            "LEFT_CHEEK",
-            "LEFT_EAR",
-            "LEFT_EYE",
-            "MOUTH_BOTTOM",
-            "MOUTH_LEFT",
-            "MOUTH_RIGHT",
-            "NOSE_BASE",
-            "RIGHT_CHEEK",
-            "RIGHT_EAR",
-            "RIGHT_EYE"
-        ];
-        var faceLandMarksTypesMap: [String: [String: CGFloat?]] = [:]
-        for i in 0..<faceLandmarkTypes.count {
-            let landmark = face.landmark(ofType: faceLandmarkTypes[i]);
-            let position = [
-                "x": landmark?.position.x ?? 0.0 * scaleX,
-                "y": landmark?.position.y ?? 0.0 * scaleY
-            ]
-            faceLandMarksTypesMap[faceLandmarksTypesStrings[i]] = position
+    // each "all" mode also sets the matching run* flag stored on the plugin
+    if config?["landmarkMode"] as? String == "all" {
+      runLandmarks = true
+      optionsBuilder.landmarkMode = .all
+    }
+    if config?["classificationMode"] as? String == "all" {
+      runClassifications = true
+      optionsBuilder.classificationMode = .all
+    }
+    if config?["contourMode"] as? String == "all" {
+      runContours = true
+      optionsBuilder.contourMode = .all
+    }
+    let minFaceSizeParam = config?["minFaceSize"] as? Double
+    if minFaceSizeParam != nil && minFaceSizeParam != minFaceSize {
+      optionsBuilder.minFaceSize = CGFloat(minFaceSizeParam!)
+    }
+    if config?["trackingEnabled"] as? Bool == true {
+      trackingEnabled = true
+      optionsBuilder.isTrackingEnabled = true
+    }
+    faceDetector = FaceDetector.faceDetector(options: optionsBuilder)
+  }
+  /// Converts the untyped plugin options into a string-keyed dictionary.
+  ///
+  /// - Parameter arguments: Options handed to the plugin; may be `nil` or empty.
+  /// - Returns: `nil` when there are no options; otherwise a copy of
+  ///   `arguments` in which every key that is not a `String` is stored
+  ///   under `""`.
+  func getConfig(
+    withArguments arguments: [AnyHashable: Any]!
+  ) -> [String:Any]! {
+    // A nil dictionary is treated like an empty one instead of trapping.
+    guard let arguments = arguments, !arguments.isEmpty else {
+      return nil
+    }
+    let pairs: [(String, Any)] = arguments.map { entry in
+      (entry.key as? String ?? "", entry.value)
+    }
+    // Several non-string keys all collapse to "", which would trap with
+    // `uniqueKeysWithValues:`; keep the first value seen for a repeated key.
+    return Dictionary(pairs, uniquingKeysWith: { first, _ in first })
+  }
+  /// Builds the bounds dictionary ("width", "height", "x", "y") for a face.
+  ///
+  /// - Parameters:
+  ///   - face: Detected face whose `frame` is converted.
+  ///   - sourceWidth: Width of the source image; only read when `autoMode` is on.
+  ///   - sourceHeight: Height of the source image; not read by this method.
+  ///   - scaleX: Factor applied to the frame width and to `origin.y`.
+  ///   - scaleY: Factor applied to the frame height and to `origin.x`.
+  /// - Returns: The scaled rectangle. With `autoMode` on, "x" is measured from
+  ///   the opposite edge of the scaled source width.
+  func processBoundingBox(
+    from face: Face,
+    sourceWidth: CGFloat,
+    sourceHeight: CGFloat,
+    scaleX: CGFloat,
+    scaleY: CGFloat
+  ) -> [String:Any] {
+    let frame = face.frame
+    let scaledWidth = frame.width * scaleX
+    let scaledHeight = frame.height * scaleY
+    // origin.y is paired with scaleX and origin.x with scaleY; which of the
+    // two is reported as "x" depends on autoMode below
+    let scaledOriginY = frame.origin.y * scaleX
+    let scaledOriginX = frame.origin.x * scaleY
+    var bounds: [String: Any] = [
+      "width": scaledWidth,
+      "height": scaledHeight
+    ]
+    if autoMode {
+      bounds["x"] = (-scaledOriginY + sourceWidth * scaleX) - scaledWidth
+      bounds["y"] = scaledOriginX
+    } else {
+      bounds["x"] = scaledOriginX
+      bounds["y"] = scaledOriginY
+    }
+    return bounds
+  }
+  /// Collects the position of every supported landmark of a face.
+  ///
+  /// - Parameters:
+  ///   - face: Detected face to read landmarks from.
+  ///   - scaleX: Factor applied to each landmark's x coordinate.
+  ///   - scaleY: Factor applied to each landmark's y coordinate.
+  /// - Returns: A dictionary keyed by landmark name (e.g. "LEFT_EYE") whose
+  ///   values hold the scaled "x" and "y". A landmark that is not available
+  ///   is reported at (0, 0).
+  func processLandmarks(
+    from face: Face,
+    scaleX: CGFloat,
+    scaleY: CGFloat
+  ) -> [String:[String: CGFloat?]] {
+    // name/type pairs kept side by side so the two can never drift apart
+    let namedLandmarkTypes: [(name: String, landmarkType: FaceLandmarkType)] = [
+      ("LEFT_CHEEK", .leftCheek),
+      ("LEFT_EAR", .leftEar),
+      ("LEFT_EYE", .leftEye),
+      ("MOUTH_BOTTOM", .mouthBottom),
+      ("MOUTH_LEFT", .mouthLeft),
+      ("MOUTH_RIGHT", .mouthRight),
+      ("NOSE_BASE", .noseBase),
+      ("RIGHT_CHEEK", .rightCheek),
+      ("RIGHT_EAR", .rightEar),
+      ("RIGHT_EYE", .rightEye)
+    ]
+    var landmarksByName: [String: [String: CGFloat?]] = [:]
+    for (name, landmarkType) in namedLandmarkTypes {
+      let position = face.landmark(ofType: landmarkType)?.position
+      // Parenthesised on purpose: `??` binds more loosely than `*`, so without
+      // the parentheses the scale would only multiply the 0.0 fallback and a
+      // detected landmark would be returned unscaled.
+      landmarksByName[name] = [
+        "x": (position?.x ?? 0.0) * scaleX,
+        "y": (position?.y ?? 0.0) * scaleY
+      ]
+    }
+    return landmarksByName
+  }
+  /// Collects the scaled points of every contour available on a face.
+  ///
+  /// - Parameters:
+  ///   - face: Detected face to read contours from.
+  ///   - scaleX: Factor applied to each point's x coordinate.
+  ///   - scaleY: Factor applied to each point's y coordinate.
+  /// - Returns: A dictionary keyed by contour name (e.g. "UPPER_LIP_TOP") whose
+  ///   values are arrays of "x"/"y" dictionaries, one per contour point.
+  func processFaceContours(
+    from face: Face,
+    scaleX: CGFloat,
+    scaleY: CGFloat
+  ) -> [String:[[String:CGFloat]]] {
+    let namedContourTypes: [(name: String, contourType: FaceContourType)] = [
+      ("FACE", .face),
+      ("LEFT_CHEEK", .leftCheek),
+      ("LEFT_EYE", .leftEye),
+      ("LEFT_EYEBROW_BOTTOM", .leftEyebrowBottom),
+      ("LEFT_EYEBROW_TOP", .leftEyebrowTop),
+      ("LOWER_LIP_BOTTOM", .lowerLipBottom),
+      ("LOWER_LIP_TOP", .lowerLipTop),
+      ("NOSE_BOTTOM", .noseBottom),
+      ("NOSE_BRIDGE", .noseBridge),
+      ("RIGHT_CHEEK", .rightCheek),
+      ("RIGHT_EYE", .rightEye),
+      ("RIGHT_EYEBROW_BOTTOM", .rightEyebrowBottom),
+      ("RIGHT_EYEBROW_TOP", .rightEyebrowTop),
+      ("UPPER_LIP_BOTTOM", .upperLipBottom),
+      ("UPPER_LIP_TOP", .upperLipTop)
+    ]
+    var contoursByName: [String:[[String:CGFloat]]] = [:]
+    for (name, contourType) in namedContourTypes {
+      // a contour type for which the face yields no contour is left out
+      if let points = face.contour(ofType: contourType)?.points {
+        contoursByName[name] = points.map { point in
+          ["x": point.x * scaleX, "y": point.y * scaleY]
         }
-        return faceLandMarksTypesMap
+      }
+    }
+    return contoursByName
+  }
+  /// Maps the orientation reported by `orientationManager`, together with the
+  /// configured camera side, to a `UIImage.Orientation`.
+  ///
+  /// - Returns: The mirrored variant for the front camera and the plain
+  ///   variant otherwise; `.up` for any orientation not listed below.
+  func getImageOrientation() -> UIImage.Orientation {
+    let usesFrontCamera = cameraFacing == .front
+    switch orientationManager.orientation {
+    case .portrait:
+      return usesFrontCamera ? .leftMirrored : .right
+    case .landscapeLeft:
+      return usesFrontCamera ? .upMirrored : .up
+    case .portraitUpsideDown:
+      return usesFrontCamera ? .rightMirrored : .left
+    case .landscapeRight:
+      return usesFrontCamera ? .downMirrored : .down
+    @unknown default:
+      return .up
     }
+  }
+  /// Runs face detection on one camera frame.
+  ///
+  /// - Parameters:
+  ///   - frame: Camera frame; its `buffer`, `width` and `height` are read.
+  ///   - arguments: Not read by this method.
+  /// - Returns: An array with one dictionary per detected face. Every entry has
+  ///   "data", "rollAngle", "pitchAngle", "yawAngle" and "bounds"; "landmarks",
+  ///   "contours", "trackingId" and the three probability keys are added only
+  ///   when the matching option flag is set. Returns `nil` when the tensor
+  ///   input for a face cannot be prepared. A thrown error is printed and the
+  ///   faces collected up to that point are returned.
+  public override func callback(
+    _ frame: Frame,
+    withArguments arguments: [AnyHashable: Any]?
+  ) -> Any? {
+    var result: [Any] = []
-    func processFaceContours(
-        from face: Face,
-        scaleX: CGFloat,
-        scaleY: CGFloat
-    ) -> [String:[[String:CGFloat]]] {
-        let faceContoursTypes = [
-            FaceContourType.face,
-            FaceContourType.leftCheek,
-            FaceContourType.leftEye,
-            FaceContourType.leftEyebrowBottom,
-            FaceContourType.leftEyebrowTop,
-            FaceContourType.lowerLipBottom,
-            FaceContourType.lowerLipTop,
-            FaceContourType.noseBottom,
-            FaceContourType.noseBridge,
-            FaceContourType.rightCheek,
-            FaceContourType.rightEye,
-            FaceContourType.rightEyebrowBottom,
-            FaceContourType.rightEyebrowTop,
-            FaceContourType.upperLipBottom,
-            FaceContourType.upperLipTop
-        ]
+    do {
+      // we need to invert sizes as frame is always -90deg rotated
+      let width = CGFloat(frame.height)
+      let height = CGFloat(frame.width)
+      let image = VisionImage(buffer: frame.buffer)
+      image.orientation = getImageOrientation()
+      // autoMode scales detector coordinates to the configured window size;
+      // otherwise coordinates are passed through unchanged (scale 1)
+      var scaleX:CGFloat
+      var scaleY:CGFloat
+      if (autoMode) {
+        scaleX = windowWidth / width
+        scaleY = windowHeight / height
+      } else {
+        scaleX = CGFloat(1)
+        scaleY = CGFloat(1)
+      }
+      let faces: [Face] = try faceDetector!.results(in: image)
+      for face in faces {
+        var map: [String: Any] = [:]
+        if enableTensor {
+          // NOTE(review): both guards below return nil for the whole frame,
+          // which also discards faces already appended to `result` - confirm
+          // this is intended rather than skipping only the current face
+          guard let imageCrop = FaceHelper.getImageFaceFromBuffer(from: frame.buffer, rectImage: face.frame, orientation: image.orientation) else {
+            return nil
+          }
+          guard let rgbData = FaceHelper.rgbDataFromBuffer(imageCrop) else {
+            return nil
+          }
+          // `interpreter` is declared outside this method; when it is nil the
+          // optional chains below do nothing and "data" ends up empty
+          try interpreter?.copy(rgbData, toInputAt: 0)
+          try interpreter?.invoke()
+          let outputTensor: Tensor? = try interpreter?.output(at: 0)
+          if ((outputTensor?.data) != nil) {
+            // this local `result` shadows the outer array of faces
+            let result: [Float] = [Float32](unsafeData: outputTensor!.data) ?? []
+            map["data"] = result
+          } else {
+            map["data"] = []
+          }
+        } else {
+          map["data"] = []
+        }
-        let faceContoursTypesStrings = [
-            "FACE",
-            "LEFT_CHEEK",
-            "LEFT_EYE",
-            "LEFT_EYEBROW_BOTTOM",
-            "LEFT_EYEBROW_TOP",
-            "LOWER_LIP_BOTTOM",
-            "LOWER_LIP_TOP",
-            "NOSE_BOTTOM",
-            "NOSE_BRIDGE",
-            "RIGHT_CHEEK",
-            "RIGHT_EYE",
-            "RIGHT_EYEBROW_BOTTOM",
-            "RIGHT_EYEBROW_TOP",
-            "UPPER_LIP_BOTTOM",
-            "UPPER_LIP_TOP"
-        ];
+        if runLandmarks {
+          map["landmarks"] = processLandmarks(
+            from: face,
+            scaleX: scaleX,
+            scaleY: scaleY
+          )
+        }
-        var faceContoursTypesMap: [String:[[String:CGFloat]]] = [:]
-        for i in 0..<faceContoursTypes.count {
-            let contour = face.contour(ofType: faceContoursTypes[i]);
-            var pointsArray: [[String:CGFloat]] = []
-            if let points = contour?.points {
-                for point in points {
-                    let currentPointsMap = [
-                        "x": point.x * scaleX,
-                        "y": point.y * scaleY,
-                    ]
-                    pointsArray.append(currentPointsMap)
-                }
-                faceContoursTypesMap[faceContoursTypesStrings[i]] = pointsArray
-            }
+        if runClassifications {
+          map["leftEyeOpenProbability"] = face.leftEyeOpenProbability
+          map["rightEyeOpenProbability"] = face.rightEyeOpenProbability
+          map["smilingProbability"] = face.smilingProbability
         }
-        return faceContoursTypesMap
-    }
-    func getOrientation(
-        orientation: UIImage.Orientation
-    ) -> UIImage.Orientation {
-        switch orientation {
-        case .up:
-            // device is landscape left
-            return .up
-        case .left:
-            // device is portrait
-            return .right
-        case .down:
-            // device is landscape right
-            return .down
-        case .right:
-            // device is upside-down
-            return .left
-        default:
-            return .up
+        if runContours {
+          map["contours"] = processFaceContours(
+            from: face,
+            scaleX: scaleX,
+            scaleY: scaleY
+          )
         }
-    }
-    public override func callback(
-        _ frame: Frame,
-        withArguments arguments: [AnyHashable: Any]?
-    ) -> Any? {
-        var result: [Any] = []
-        do {
-            // we need to invert sizes as frame is always -90deg rotated
-            let width = CGFloat(frame.height)
-            let height = CGFloat(frame.width)
-            let orientation = getOrientation(
-                orientation: frame.orientation
-            )
-            let image = VisionImage(buffer: frame.buffer)
-            image.orientation = orientation
-            var scaleX:CGFloat
-            var scaleY:CGFloat
-            if autoScale {
-                scaleX = screenBounds.size.width / width
-                scaleY = screenBounds.size.height / height
-            } else {
-                scaleX = CGFloat(1)
-                scaleY = CGFloat(1)
-            }
-            let faces: [Face] = try faceDetector!.results(in: image)
-            for face in faces {
-                var map: [String: Any] = [:]
-                if enableTensor {
-                    guard let imageCrop = FaceHelper.getImageFaceFromBuffer(from: frame.buffer, rectImage: face.frame, orientation: orientation) else {
-                        return nil
-                    }
-                    guard let pixelBuffer = FaceHelper.uiImageToPixelBuffer(image: imageCrop, size: inputWidth) else {
-                        return nil
-                    }
-                    guard let rgbData = FaceHelper.rgbDataFromBuffer(pixelBuffer) else {
-                        return nil
-                    }
-                    try interpreter?.copy(rgbData, toInputAt: 0)
-                    try interpreter?.invoke()
-                    let outputTensor: Tensor? = try interpreter?.output(at: 0)
-                    if ((outputTensor?.data) != nil) {
-                        let result: [Float] = [Float32](unsafeData: outputTensor!.data) ?? []
-                        map["data"] = result
-                    } else {
-                        map["data"] = []
-                    }
-                } else {
-                    map["data"] = []
-                }
-                if runLandmarks {
-                    map["landmarks"] = processLandmarks(
-                        from: face,
-                        scaleX: scaleX,
-                        scaleY: scaleY
-                    )
-                }
-                if runClassifications {
-                    map["leftEyeOpenProbability"] = face.leftEyeOpenProbability
-                    map["rightEyeOpenProbability"] = face.rightEyeOpenProbability
-                    map["smilingProbability"] = face.smilingProbability
-                }
-                if runContours {
-                    map["contours"] = processFaceContours(
-                        from: face,
-                        scaleX: scaleX,
-                        scaleY: scaleY
-                    )
-                }
-                if trackingEnabled {
-                    map["trackingId"] = face.trackingID
-                }
-                map["rollAngle"] = face.headEulerAngleZ
-                map["pitchAngle"] = face.headEulerAngleX
-                map["yawAngle"] = face.headEulerAngleY
-                map["bounds"] = processBoundingBox(
-                    from: face,
-                    sourceWidth: width,
-                    sourceHeight: height,
-                    orientation: frame.orientation,
-                    scaleX: scaleX,
-                    scaleY: scaleY
-                )
-                result.append(map)
-            }
-        } catch let error {
-            print("Error processing face detection: \(error)")
+        if trackingEnabled {
+          map["trackingId"] = face.trackingID
         }
-        return result
+        // head pose: roll = Z, pitch = X, yaw = Y Euler angle of the face
+        map["rollAngle"] = face.headEulerAngleZ
+        map["pitchAngle"] = face.headEulerAngleX
+        map["yawAngle"] = face.headEulerAngleY
+        map["bounds"] = processBoundingBox(
+          from: face,
+          sourceWidth: width,
+          sourceHeight: height,
+          scaleX: scaleX,
+          scaleY: scaleY
+        )
+        result.append(map)
+      }
+    } catch let error {
+      // best effort: the error is only logged and the partial result is returned
+      print("Error processing face detection: \(error)")
     }
+    return result
+  }
 }