npm - @mleonard9/vin-scanner - Versions diffs - 0.2.8 → 1.0.0 - Mend

@mleonard9/vin-scanner 0.2.8 → 1.0.0

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (3)

package/ios/VisionCameraBarcodeScanner.m +23 -12
package/ios/VisionCameraTextRecognition.m +27 -27
package/package.json +1 -1

package/ios/VisionCameraBarcodeScanner.m CHANGED Viewed

@@ -5,7 +5,6 @@
 #import <VisionCamera/Frame.h>
 #import <VisionCamera/SharedArray.h>
 #import <React/RCTBridgeModule.h>
-#import <CoreVideo/CoreVideo.h>
 @import MLKitVision;
 @interface VisionCameraBarcodeScannerPlugin : FrameProcessorPlugin
@@ -59,14 +58,30 @@
         orientation = [self orientationFromValue:orientationOverride fallback:orientation];
     }
-    // Get image dimensions for coordinate transformation
-    CVImageBufferRef imageBuffer = CMSampleBufferGetImageBuffer(buffer);
-    size_t imageHeight = CVPixelBufferGetHeight(imageBuffer);
+    // Fix vertical flip issue on iOS by rotating orientation 180 degrees
+    // This ensures ML Kit processes the image in the correct orientation
+    UIImageOrientation correctedOrientation = orientation;
+    switch (orientation) {
+        case UIImageOrientationUp:
+            correctedOrientation = UIImageOrientationDown;
+            break;
+        case UIImageOrientationDown:
+            correctedOrientation = UIImageOrientationUp;
+            break;
+        case UIImageOrientationLeft:
+            correctedOrientation = UIImageOrientationRight;
+            break;
+        case UIImageOrientationRight:
+            correctedOrientation = UIImageOrientationLeft;
+            break;
+        default:
+            break;
+    }
     // VisionCamera already normalizes orientation per https://react-native-vision-camera.com/docs/guides/orientation,
     // so ML Kit just needs the frame's orientation metadata instead of rotating pixels manually.
     MLKVisionImage *image = [[MLKVisionImage alloc] initWithBuffer:buffer];
-    image.orientation = orientation;
+    image.orientation = correctedOrientation;
     NSMutableArray *detections = [NSMutableArray array];
     __block NSDictionary *resultPayload = @{};
     dispatch_group_t dispatchGroup = dispatch_group_create();
@@ -97,13 +112,9 @@
                 if (boxData != nil) {
                     CGRect frameRect = barcode.frame;
                     const NSUInteger baseIndex = idx * 6;
-                    // Transform Y coordinates to fix vertical flip issue on iOS
-                    // ML Kit returns coordinates in image space, but VisionCamera expects them flipped
-                    float minY = CGRectGetMinY(frameRect);
-                    float maxY = CGRectGetMaxY(frameRect);
-                    float imageHeightFloat = (float)imageHeight;
-                    boxData[baseIndex] = imageHeightFloat - maxY;  // top = height - bottom
-                    boxData[baseIndex + 1] = imageHeightFloat - minY;  // bottom = height - top
+                    // Coordinates are now correct after orientation fix
+                    boxData[baseIndex] = CGRectGetMinY(frameRect);
+                    boxData[baseIndex + 1] = CGRectGetMaxY(frameRect);
                     boxData[baseIndex + 2] = CGRectGetMinX(frameRect);
                     boxData[baseIndex + 3] = CGRectGetMaxX(frameRect);
                     boxData[baseIndex + 4] = CGRectGetWidth(frameRect);

package/ios/VisionCameraTextRecognition.m CHANGED Viewed

@@ -9,7 +9,6 @@
 #import <VisionCamera/VisionCameraProxyHolder.h>
 #import <VisionCamera/Frame.h>
 #import <VisionCamera/SharedArray.h>
-#import <CoreVideo/CoreVideo.h>
 @import MLKitVision;
 @interface VisionCameraTextRecognitionPlugin : FrameProcessorPlugin
@@ -88,13 +87,28 @@
         orientation = [self orientationFromValue:orientationOverride fallback:orientation];
     }
-    // Get image dimensions for coordinate transformation
-    CVImageBufferRef imageBuffer = CMSampleBufferGetImageBuffer(buffer);
-    size_t imageHeight = CVPixelBufferGetHeight(imageBuffer);
-    float imageHeightFloat = (float)imageHeight;
+    // Fix vertical flip issue on iOS by rotating orientation 180 degrees
+    // This ensures ML Kit processes the image in the correct orientation
+    UIImageOrientation correctedOrientation = orientation;
+    switch (orientation) {
+        case UIImageOrientationUp:
+            correctedOrientation = UIImageOrientationDown;
+            break;
+        case UIImageOrientationDown:
+            correctedOrientation = UIImageOrientationUp;
+            break;
+        case UIImageOrientationLeft:
+            correctedOrientation = UIImageOrientationRight;
+            break;
+        case UIImageOrientationRight:
+            correctedOrientation = UIImageOrientationLeft;
+            break;
+        default:
+            break;
+    }
     MLKVisionImage *image = [[MLKVisionImage alloc] initWithBuffer:buffer];
-    image.orientation = orientation;
+    image.orientation = correctedOrientation;
     NSMutableArray *detections = [NSMutableArray array];
     NSMutableArray<NSArray<NSNumber *> *> *boxValues = [NSMutableArray array];
     NSString *language = arguments[@"language"] ?: self.preferredLanguage ?: @"latin";
@@ -112,11 +126,7 @@
             NSString *resultText = result.text;
             for (MLKTextBlock *block in result.blocks) {
                 CGRect blockFrame = block.frame;
-                // Transform Y coordinates to fix vertical flip issue on iOS
-                float blockMinY = CGRectGetMinY(blockFrame);
-                float blockMaxY = CGRectGetMaxY(blockFrame);
-                float blockTransformedMinY = imageHeightFloat - blockMaxY;
-                float blockTransformedMaxY = imageHeightFloat - blockMinY;
+                // Coordinates are now correct after orientation fix
                 if (block.lines.count == 0) {
                     NSMutableDictionary *entry = [[NSMutableDictionary alloc] init];
@@ -125,7 +135,7 @@
                     entry[@"boxIndex"] = @(boxValues.count);
                     [detections addObject:entry];
                     [boxValues addObject:@[
-                        @(blockTransformedMinY), @(blockTransformedMaxY),
+                        @(CGRectGetMinY(blockFrame)), @(CGRectGetMaxY(blockFrame)),
                         @(CGRectGetMinX(blockFrame)), @(CGRectGetMaxX(blockFrame)),
                         @(-1.f), @(-1.f), @(-1.f), @(-1.f),
                         @(-1.f), @(-1.f), @(-1.f), @(-1.f)
@@ -133,11 +143,6 @@
                 }
                 for (MLKTextLine *line in block.lines) {
                     CGRect lineFrame = line.frame;
-                    // Transform Y coordinates for line frame
-                    float lineMinY = CGRectGetMinY(lineFrame);
-                    float lineMaxY = CGRectGetMaxY(lineFrame);
-                    float lineTransformedMinY = imageHeightFloat - lineMaxY;
-                    float lineTransformedMaxY = imageHeightFloat - lineMinY;
                     if (line.elements.count == 0) {
                         NSMutableDictionary *entry = [[NSMutableDictionary alloc] init];
@@ -147,20 +152,15 @@
                         entry[@"boxIndex"] = @(boxValues.count);
                         [detections addObject:entry];
                         [boxValues addObject:@[
-                            @(blockTransformedMinY), @(blockTransformedMaxY),
+                            @(CGRectGetMinY(blockFrame)), @(CGRectGetMaxY(blockFrame)),
                             @(CGRectGetMinX(blockFrame)), @(CGRectGetMaxX(blockFrame)),
-                            @(lineTransformedMinY), @(lineTransformedMaxY),
+                            @(CGRectGetMinY(lineFrame)), @(CGRectGetMaxY(lineFrame)),
                             @(CGRectGetMinX(lineFrame)), @(CGRectGetMaxX(lineFrame)),
                             @(-1.f), @(-1.f), @(-1.f), @(-1.f)
                         ]];
                     }
                     for (MLKTextElement *element in line.elements) {
                         CGRect elementFrame = element.frame;
-                        // Transform Y coordinates for element frame
-                        float elementMinY = CGRectGetMinY(elementFrame);
-                        float elementMaxY = CGRectGetMaxY(elementFrame);
-                        float elementTransformedMinY = imageHeightFloat - elementMaxY;
-                        float elementTransformedMaxY = imageHeightFloat - elementMinY;
                         NSMutableDictionary *entry = [[NSMutableDictionary alloc] init];
                         entry[@"resultText"] = resultText ?: (id)kCFNull;
@@ -170,11 +170,11 @@
                         entry[@"boxIndex"] = @(boxValues.count);
                         [detections addObject:entry];
                         [boxValues addObject:@[
-                            @(blockTransformedMinY), @(blockTransformedMaxY),
+                            @(CGRectGetMinY(blockFrame)), @(CGRectGetMaxY(blockFrame)),
                             @(CGRectGetMinX(blockFrame)), @(CGRectGetMaxX(blockFrame)),
-                            @(lineTransformedMinY), @(lineTransformedMaxY),
+                            @(CGRectGetMinY(lineFrame)), @(CGRectGetMaxY(lineFrame)),
                             @(CGRectGetMinX(lineFrame)), @(CGRectGetMaxX(lineFrame)),
-                            @(elementTransformedMinY), @(elementTransformedMaxY),
+                            @(CGRectGetMinY(elementFrame)), @(CGRectGetMaxY(elementFrame)),
                             @(CGRectGetMinX(elementFrame)), @(CGRectGetMaxX(elementFrame))
                         ]];
                     }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@mleonard9/vin-scanner",
-  "version": "0.2.8",
+  "version": "1.0.0",
   "description": "High-performance VIN scanner for React Native Vision Camera powered by Google ML Kit barcode + text recognition.",
   "main": "lib/commonjs/index",
   "module": "lib/module/index",