react-native-executorch 0.4.10 → 0.5.0-nightly-6f4dd53-20251211
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +77 -71
- package/android/CMakeLists.txt +29 -0
- package/android/build.gradle +76 -13
- package/android/libs/classes.jar +0 -0
- package/android/src/main/cpp/CMakeLists.txt +109 -0
- package/android/src/main/cpp/ETInstallerModule.cpp +76 -0
- package/android/src/main/cpp/ETInstallerModule.h +43 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/ETInstaller.kt +66 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/RnExecutorchPackage.kt +6 -124
- package/common/ada/ada.cpp +17406 -0
- package/common/ada/ada.h +10274 -0
- package/common/pfft/pfft.c +2205 -0
- package/common/pfft/pfft.h +185 -0
- package/common/rnexecutorch/Log.h +489 -0
- package/common/rnexecutorch/RnExecutorchInstaller.cpp +113 -0
- package/common/rnexecutorch/RnExecutorchInstaller.h +87 -0
- package/common/rnexecutorch/TokenizerModule.cpp +52 -0
- package/common/rnexecutorch/TokenizerModule.h +29 -0
- package/common/rnexecutorch/data_processing/FFT.cpp +21 -0
- package/common/rnexecutorch/data_processing/FFT.h +23 -0
- package/common/rnexecutorch/data_processing/FileUtils.h +30 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.cpp +240 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.h +55 -0
- package/common/rnexecutorch/data_processing/Numerical.cpp +111 -0
- package/common/rnexecutorch/data_processing/Numerical.h +77 -0
- package/common/rnexecutorch/data_processing/base64.cpp +110 -0
- package/common/rnexecutorch/data_processing/base64.h +46 -0
- package/common/rnexecutorch/data_processing/dsp.cpp +19 -0
- package/common/rnexecutorch/data_processing/dsp.h +12 -0
- package/common/rnexecutorch/data_processing/gzip.cpp +47 -0
- package/common/rnexecutorch/data_processing/gzip.h +7 -0
- package/common/rnexecutorch/host_objects/JSTensorViewIn.h +12 -0
- package/common/rnexecutorch/host_objects/JSTensorViewOut.h +22 -0
- package/common/rnexecutorch/host_objects/JsiConversions.h +418 -0
- package/common/rnexecutorch/host_objects/ModelHostObject.h +313 -0
- package/common/rnexecutorch/jsi/JsiHostObject.cpp +108 -0
- package/common/rnexecutorch/jsi/JsiHostObject.h +87 -0
- package/common/rnexecutorch/jsi/OwningArrayBuffer.h +57 -0
- package/common/rnexecutorch/jsi/Promise.cpp +20 -0
- package/common/rnexecutorch/jsi/Promise.h +69 -0
- package/common/rnexecutorch/jsi/RuntimeAwareCache.h +58 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.cpp +53 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.h +35 -0
- package/common/rnexecutorch/metaprogramming/ConstructorHelpers.h +133 -0
- package/common/rnexecutorch/metaprogramming/FunctionHelpers.h +50 -0
- package/common/rnexecutorch/metaprogramming/TypeConcepts.h +37 -0
- package/common/rnexecutorch/models/BaseModel.cpp +183 -0
- package/common/rnexecutorch/models/BaseModel.h +61 -0
- package/common/rnexecutorch/models/classification/Classification.cpp +72 -0
- package/common/rnexecutorch/models/classification/Classification.h +31 -0
- package/{ios/RnExecutorch/models/classification/Constants.mm → common/rnexecutorch/models/classification/Constants.h} +7 -2
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.cpp +19 -0
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.h +17 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.cpp +45 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.h +28 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.cpp +60 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.h +31 -0
- package/{ios/RnExecutorch/models/image_segmentation/Constants.mm → common/rnexecutorch/models/image_segmentation/Constants.h} +7 -2
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.cpp +168 -0
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.h +50 -0
- package/common/rnexecutorch/models/llm/LLM.cpp +98 -0
- package/common/rnexecutorch/models/llm/LLM.h +38 -0
- package/{ios/RnExecutorch/utils/Constants.mm → common/rnexecutorch/models/object_detection/Constants.h} +9 -2
- package/common/rnexecutorch/models/object_detection/ObjectDetection.cpp +82 -0
- package/common/rnexecutorch/models/object_detection/ObjectDetection.h +37 -0
- package/common/rnexecutorch/models/object_detection/Types.h +13 -0
- package/{ios/RnExecutorch/utils/ObjectDetectionUtils.mm → common/rnexecutorch/models/object_detection/Utils.cpp} +17 -35
- package/common/rnexecutorch/models/object_detection/Utils.h +11 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.cpp +88 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.h +29 -0
- package/common/rnexecutorch/models/ocr/Constants.h +41 -0
- package/common/rnexecutorch/models/ocr/Detector.cpp +100 -0
- package/common/rnexecutorch/models/ocr/Detector.h +30 -0
- package/common/rnexecutorch/models/ocr/OCR.cpp +53 -0
- package/common/rnexecutorch/models/ocr/OCR.h +44 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.cpp +108 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.h +42 -0
- package/common/rnexecutorch/models/ocr/Recognizer.cpp +80 -0
- package/common/rnexecutorch/models/ocr/Recognizer.h +36 -0
- package/common/rnexecutorch/models/ocr/Types.h +35 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.cpp +710 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.h +81 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.cpp +159 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.h +72 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.cpp +204 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.h +71 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +125 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +57 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.cpp +303 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.h +61 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.cpp +82 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.h +25 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.cpp +99 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.h +33 -0
- package/common/rnexecutorch/models/speech_to_text/types/DecodingOptions.h +15 -0
- package/common/rnexecutorch/models/speech_to_text/types/GenerationResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/ProcessResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/Segment.h +14 -0
- package/common/rnexecutorch/models/speech_to_text/types/Word.h +13 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.cpp +55 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.h +35 -0
- package/common/rnexecutorch/models/text_to_image/Constants.h +9 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.cpp +32 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.h +24 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.cpp +44 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.h +32 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.cpp +152 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.h +41 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.cpp +141 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.h +64 -0
- package/common/rnexecutorch/models/text_to_image/UNet.cpp +38 -0
- package/common/rnexecutorch/models/text_to_image/UNet.h +28 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.cpp +93 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.h +49 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.cpp +180 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.h +85 -0
- package/common/rnexecutorch/models/voice_activity_detection/Constants.h +27 -0
- package/common/rnexecutorch/models/voice_activity_detection/Types.h +12 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.cpp +15 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.h +13 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.cpp +160 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.h +36 -0
- package/common/rnexecutorch/tests/CMakeLists.txt +30 -0
- package/common/rnexecutorch/tests/LogTest.cpp +530 -0
- package/common/rnexecutorch/tests/NumericalTest.cpp +110 -0
- package/common/rnexecutorch/tests/README.md +37 -0
- package/common/rnexecutorch/threads/GlobalThreadPool.h +84 -0
- package/common/rnexecutorch/threads/HighPerformanceThreadPool.h +364 -0
- package/common/rnexecutorch/threads/utils/ThreadUtils.h +29 -0
- package/common/runner/arange_util.cpp +44 -0
- package/common/runner/arange_util.h +37 -0
- package/common/runner/constants.h +28 -0
- package/common/runner/io_manager.h +240 -0
- package/common/runner/irunner.h +119 -0
- package/common/runner/kernel_includes.h +23 -0
- package/common/runner/runner.cpp +369 -0
- package/common/runner/runner.h +85 -0
- package/common/runner/sampler.cpp +201 -0
- package/common/runner/sampler.h +67 -0
- package/common/runner/stats.h +161 -0
- package/common/runner/text_decoder_runner.cpp +79 -0
- package/common/runner/text_decoder_runner.h +126 -0
- package/common/runner/text_prefiller.cpp +125 -0
- package/common/runner/text_prefiller.h +85 -0
- package/common/runner/text_token_generator.h +205 -0
- package/common/runner/util.h +153 -0
- package/ios/RnExecutorch/ETInstaller.h +8 -0
- package/ios/RnExecutorch/ETInstaller.mm +56 -0
- package/ios/RnExecutorch.xcodeproj/project.pbxproj +73 -23
- package/lib/module/Error.js +3 -0
- package/lib/module/Error.js.map +1 -1
- package/lib/module/common/Logger.js +23 -0
- package/lib/module/common/Logger.js.map +1 -0
- package/lib/module/constants/directories.js +1 -1
- package/lib/module/constants/directories.js.map +1 -1
- package/lib/module/constants/llmDefaults.js +8 -0
- package/lib/module/constants/llmDefaults.js.map +1 -1
- package/lib/module/constants/modelUrls.js +356 -84
- package/lib/module/constants/modelUrls.js.map +1 -1
- package/lib/module/constants/ocr/models.js +181 -286
- package/lib/module/constants/ocr/models.js.map +1 -1
- package/lib/module/constants/ocr/symbols.js +66 -65
- package/lib/module/constants/ocr/symbols.js.map +1 -1
- package/lib/module/controllers/LLMController.js +53 -23
- package/lib/module/controllers/LLMController.js.map +1 -1
- package/lib/module/controllers/OCRController.js +17 -10
- package/lib/module/controllers/OCRController.js.map +1 -1
- package/lib/module/controllers/VerticalOCRController.js +17 -10
- package/lib/module/controllers/VerticalOCRController.js.map +1 -1
- package/lib/module/hooks/computer_vision/useClassification.js +4 -4
- package/lib/module/hooks/computer_vision/useClassification.js.map +1 -1
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js +13 -0
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js.map +1 -0
- package/lib/module/hooks/computer_vision/useImageSegmentation.js +2 -2
- package/lib/module/hooks/computer_vision/useImageSegmentation.js.map +1 -1
- package/lib/module/hooks/computer_vision/useOCR.js +16 -17
- package/lib/module/hooks/computer_vision/useOCR.js.map +1 -1
- package/lib/module/hooks/computer_vision/useObjectDetection.js +3 -3
- package/lib/module/hooks/computer_vision/useObjectDetection.js.map +1 -1
- package/lib/module/hooks/computer_vision/useStyleTransfer.js +3 -3
- package/lib/module/hooks/computer_vision/useStyleTransfer.js.map +1 -1
- package/lib/module/hooks/computer_vision/useTextToImage.js +57 -0
- package/lib/module/hooks/computer_vision/useTextToImage.js.map +1 -0
- package/lib/module/hooks/computer_vision/useVerticalOCR.js +18 -19
- package/lib/module/hooks/computer_vision/useVerticalOCR.js.map +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useLLM.js +30 -29
- package/lib/module/hooks/natural_language_processing/useLLM.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js +72 -33
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js +2 -3
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTokenizer.js +19 -18
- package/lib/module/hooks/natural_language_processing/useTokenizer.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useVAD.js +13 -0
- package/lib/module/hooks/natural_language_processing/useVAD.js.map +1 -0
- package/lib/module/hooks/useModule.js +13 -9
- package/lib/module/hooks/useModule.js.map +1 -1
- package/lib/module/index.js +21 -3
- package/lib/module/index.js.map +1 -1
- package/lib/module/modules/BaseModule.js +9 -14
- package/lib/module/modules/BaseModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ClassificationModule.js +11 -6
- package/lib/module/modules/computer_vision/ClassificationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js +19 -0
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js.map +1 -0
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js +20 -18
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/OCRModule.js +13 -10
- package/lib/module/modules/computer_vision/OCRModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js +11 -6
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js.map +1 -1
- package/lib/module/modules/computer_vision/StyleTransferModule.js +11 -6
- package/lib/module/modules/computer_vision/StyleTransferModule.js.map +1 -1
- package/lib/module/modules/computer_vision/TextToImageModule.js +48 -0
- package/lib/module/modules/computer_vision/TextToImageModule.js.map +1 -0
- package/lib/module/modules/computer_vision/VerticalOCRModule.js +15 -10
- package/lib/module/modules/computer_vision/VerticalOCRModule.js.map +1 -1
- package/lib/module/modules/general/ExecutorchModule.js +8 -34
- package/lib/module/modules/general/ExecutorchModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/LLMModule.js +25 -24
- package/lib/module/modules/natural_language_processing/LLMModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +109 -27
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js +13 -6
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TokenizerModule.js +20 -14
- package/lib/module/modules/natural_language_processing/TokenizerModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/VADModule.js +19 -0
- package/lib/module/modules/natural_language_processing/VADModule.js.map +1 -0
- package/lib/module/native/NativeETInstaller.js +5 -0
- package/lib/module/native/NativeETInstaller.js.map +1 -0
- package/lib/module/native/RnExecutorchModules.js +2 -12
- package/lib/module/native/RnExecutorchModules.js.map +1 -1
- package/lib/module/types/common.js +25 -8
- package/lib/module/types/common.js.map +1 -1
- package/lib/module/types/llm.js.map +1 -1
- package/lib/module/types/stt.js +1 -79
- package/lib/module/types/stt.js.map +1 -1
- package/lib/module/types/vad.js +2 -0
- package/lib/module/types/vad.js.map +1 -0
- package/lib/module/utils/ResourceFetcher.js +275 -114
- package/lib/module/utils/ResourceFetcher.js.map +1 -1
- package/lib/module/utils/ResourceFetcherUtils.js +155 -0
- package/lib/module/utils/ResourceFetcherUtils.js.map +1 -0
- package/lib/module/utils/llm.js +41 -1
- package/lib/module/utils/llm.js.map +1 -1
- package/lib/typescript/Error.d.ts +3 -0
- package/lib/typescript/Error.d.ts.map +1 -1
- package/lib/typescript/common/Logger.d.ts +9 -0
- package/lib/typescript/common/Logger.d.ts.map +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts.map +1 -1
- package/lib/typescript/constants/modelUrls.d.ts +263 -79
- package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/models.d.ts +882 -284
- package/lib/typescript/constants/ocr/models.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts.map +1 -1
- package/lib/typescript/controllers/LLMController.d.ts +8 -7
- package/lib/typescript/controllers/LLMController.d.ts.map +1 -1
- package/lib/typescript/controllers/OCRController.d.ts +5 -6
- package/lib/typescript/controllers/OCRController.d.ts.map +1 -1
- package/lib/typescript/controllers/VerticalOCRController.d.ts +5 -6
- package/lib/typescript/controllers/VerticalOCRController.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts +8 -6
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts +16 -0
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts +5 -5
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts +22 -0
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts +4 -6
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/general/useExecutorchModule.d.ts +1 -1
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -22
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts +9 -5
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts +16 -0
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts.map +1 -0
- package/lib/typescript/hooks/useModule.d.ts +8 -5
- package/lib/typescript/hooks/useModule.d.ts.map +1 -1
- package/lib/typescript/index.d.ts +26 -3
- package/lib/typescript/index.d.ts.map +1 -1
- package/lib/typescript/modules/BaseModule.d.ts +7 -6
- package/lib/typescript/modules/BaseModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts +4 -4
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts +9 -0
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts +7 -27
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts +8 -7
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts +5 -3
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts +4 -3
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts +16 -0
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts +7 -8
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/general/ExecutorchModule.d.ts +4 -7
- package/lib/typescript/modules/general/ExecutorchModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts +19 -17
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +17 -13
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts +5 -3
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts +10 -9
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts +10 -0
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts.map +1 -0
- package/lib/typescript/native/{NativeStyleTransfer.d.ts → NativeETInstaller.d.ts} +2 -3
- package/lib/typescript/native/NativeETInstaller.d.ts.map +1 -0
- package/lib/typescript/native/RnExecutorchModules.d.ts +3 -23
- package/lib/typescript/native/RnExecutorchModules.d.ts.map +1 -1
- package/lib/typescript/types/common.d.ts +30 -2
- package/lib/typescript/types/common.d.ts.map +1 -1
- package/lib/typescript/types/llm.d.ts +9 -1
- package/lib/typescript/types/llm.d.ts.map +1 -1
- package/lib/typescript/types/stt.d.ts +9 -88
- package/lib/typescript/types/stt.d.ts.map +1 -1
- package/lib/typescript/types/vad.d.ts +5 -0
- package/lib/typescript/types/vad.d.ts.map +1 -0
- package/lib/typescript/utils/ResourceFetcher.d.ts +47 -10
- package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts +55 -0
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -0
- package/lib/typescript/utils/llm.d.ts +4 -0
- package/lib/typescript/utils/llm.d.ts.map +1 -1
- package/package.json +32 -68
- package/react-native-executorch.podspec +62 -4
- package/src/Error.ts +3 -0
- package/src/common/Logger.ts +25 -0
- package/src/constants/directories.ts +1 -1
- package/src/constants/llmDefaults.ts +11 -0
- package/src/constants/modelUrls.ts +433 -168
- package/src/constants/ocr/models.ts +826 -395
- package/src/constants/ocr/symbols.ts +66 -65
- package/src/controllers/LLMController.ts +76 -36
- package/src/controllers/OCRController.ts +25 -16
- package/src/controllers/VerticalOCRController.ts +25 -15
- package/src/hooks/computer_vision/useClassification.ts +8 -9
- package/src/hooks/computer_vision/useImageEmbeddings.ts +15 -0
- package/src/hooks/computer_vision/useImageSegmentation.ts +3 -6
- package/src/hooks/computer_vision/useOCR.ts +32 -25
- package/src/hooks/computer_vision/useObjectDetection.ts +4 -7
- package/src/hooks/computer_vision/useStyleTransfer.ts +4 -4
- package/src/hooks/computer_vision/useTextToImage.ts +92 -0
- package/src/hooks/computer_vision/useVerticalOCR.ts +33 -31
- package/src/hooks/general/useExecutorchModule.ts +1 -1
- package/src/hooks/natural_language_processing/useLLM.ts +54 -31
- package/src/hooks/natural_language_processing/useSpeechToText.ts +96 -88
- package/src/hooks/natural_language_processing/useTextEmbeddings.ts +9 -9
- package/src/hooks/natural_language_processing/useTokenizer.ts +21 -21
- package/src/hooks/natural_language_processing/useVAD.ts +15 -0
- package/src/hooks/useModule.ts +23 -13
- package/src/index.ts +126 -0
- package/src/modules/BaseModule.ts +17 -22
- package/src/modules/computer_vision/ClassificationModule.ts +18 -9
- package/src/modules/computer_vision/ImageEmbeddingsModule.ts +26 -0
- package/src/modules/computer_vision/ImageSegmentationModule.ts +34 -26
- package/src/modules/computer_vision/OCRModule.ts +23 -15
- package/src/modules/computer_vision/ObjectDetectionModule.ts +22 -9
- package/src/modules/computer_vision/StyleTransferModule.ts +18 -9
- package/src/modules/computer_vision/TextToImageModule.ts +93 -0
- package/src/modules/computer_vision/VerticalOCRModule.ts +25 -21
- package/src/modules/general/ExecutorchModule.ts +16 -46
- package/src/modules/natural_language_processing/LLMModule.ts +41 -32
- package/src/modules/natural_language_processing/SpeechToTextModule.ts +164 -66
- package/src/modules/natural_language_processing/TextEmbeddingsModule.ts +25 -10
- package/src/modules/natural_language_processing/TokenizerModule.ts +27 -17
- package/src/modules/natural_language_processing/VADModule.ts +27 -0
- package/src/native/NativeETInstaller.ts +8 -0
- package/src/native/RnExecutorchModules.ts +4 -50
- package/src/types/common.ts +40 -12
- package/src/types/llm.ts +10 -0
- package/src/types/stt.ts +87 -90
- package/src/types/vad.ts +4 -0
- package/src/utils/ResourceFetcher.ts +342 -120
- package/src/utils/ResourceFetcherUtils.ts +184 -0
- package/src/utils/llm.ts +65 -1
- package/third-party/android/libs/cpuinfo/arm64-v8a/libcpuinfo.so +0 -0
- package/third-party/android/libs/executorch/arm64-v8a/libexecutorch.so +0 -0
- package/third-party/android/libs/executorch/x86_64/libexecutorch.so +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_hal.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_thread.a +0 -0
- package/third-party/android/libs/pthreadpool/arm64-v8a/libpthreadpool.so +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libsentencepiece.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_cpp.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib → third-party/android/libs/tokenizers-cpp/x86_64/libsentencepiece.a} +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_cpp.a +0 -0
- package/third-party/include/c10/macros/Export.h +1 -0
- package/third-party/include/c10/macros/Macros.h +1 -0
- package/third-party/include/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/c10/util/BFloat16.h +1 -0
- package/third-party/include/c10/util/Half-inl.h +1 -0
- package/third-party/include/c10/util/Half.h +8 -0
- package/third-party/include/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/c10/util/bit_cast.h +1 -0
- package/third-party/include/c10/util/complex.h +72 -0
- package/third-party/include/c10/util/complex_math.h +399 -0
- package/third-party/include/c10/util/complex_utils.h +41 -0
- package/third-party/include/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/c10/util/irange.h +107 -0
- package/third-party/include/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/c10/util/overflows.h +95 -0
- package/third-party/include/c10/util/safe_numerics.h +97 -0
- package/third-party/include/cpuinfo/cpuinfo.h +2305 -0
- package/third-party/include/executorch/ExecuTorch.h +13 -0
- package/third-party/include/executorch/ExecuTorchError.h +90 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLM.h +12 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMConfig.h +56 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMError.h +16 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMMultimodalRunner.h +227 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMTextRunner.h +97 -0
- package/third-party/include/executorch/ExecuTorchLLM/module.modulemap +4 -0
- package/third-party/include/executorch/ExecuTorchLog.h +77 -0
- package/third-party/include/executorch/ExecuTorchModule.h +563 -0
- package/third-party/include/executorch/ExecuTorchTensor.h +1421 -0
- package/third-party/include/executorch/ExecuTorchValue.h +265 -0
- package/third-party/include/executorch/extension/module/bundled_module.h +131 -0
- package/third-party/include/executorch/extension/module/module.h +649 -0
- package/third-party/include/executorch/extension/tensor/tensor.h +14 -0
- package/third-party/include/executorch/extension/tensor/tensor_accessor.h +190 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr.h +409 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr_maker.h +653 -0
- package/third-party/include/executorch/extension/threadpool/cpuinfo_utils.h +24 -0
- package/third-party/include/executorch/extension/threadpool/threadpool.h +95 -0
- package/third-party/include/executorch/runtime/backend/backend_execution_context.h +71 -0
- package/third-party/include/executorch/runtime/backend/backend_init_context.h +84 -0
- package/third-party/include/executorch/runtime/backend/backend_option_context.h +34 -0
- package/third-party/include/executorch/runtime/backend/interface.h +227 -0
- package/third-party/include/executorch/runtime/backend/options.h +206 -0
- package/third-party/include/executorch/runtime/core/array_ref.h +235 -0
- package/third-party/include/executorch/runtime/core/data_loader.h +136 -0
- package/third-party/include/executorch/runtime/core/defines.h +20 -0
- package/third-party/include/executorch/runtime/core/error.h +256 -0
- package/third-party/include/executorch/runtime/core/evalue.h +515 -0
- package/third-party/include/executorch/runtime/core/event_tracer.h +580 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks.h +332 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks_delegate.h +197 -0
- package/third-party/include/executorch/runtime/core/exec_aten/exec_aten.h +170 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/dim_order_util.h +264 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/scalar_type_util.h +1313 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_dimension_limit.h +21 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_shape_to_c_string.h +69 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_util.h +1251 -0
- package/third-party/include/executorch/runtime/core/freeable_buffer.h +107 -0
- package/third-party/include/executorch/runtime/core/function_ref.h +100 -0
- package/third-party/include/executorch/runtime/core/hierarchical_allocator.h +107 -0
- package/third-party/include/executorch/runtime/core/memory_allocator.h +208 -0
- package/third-party/include/executorch/runtime/core/named_data_map.h +76 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16_math.h +14 -0
- package/third-party/include/executorch/runtime/core/portable_type/bits_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Export.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Macros.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half.h +8 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/bit_cast.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex.h +72 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_math.h +399 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_utils.h +41 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/irange.h +107 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/overflows.h +95 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/safe_numerics.h +97 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/include/executorch/runtime/core/portable_type/complex.h +21 -0
- package/third-party/include/executorch/runtime/core/portable_type/device.h +70 -0
- package/third-party/include/executorch/runtime/core/portable_type/half.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/optional.h +36 -0
- package/third-party/include/executorch/runtime/core/portable_type/qint_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar.h +110 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar_type.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/string_view.h +29 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor.h +142 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_impl.h +281 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_options.h +60 -0
- package/third-party/include/executorch/runtime/core/result.h +258 -0
- package/third-party/include/executorch/runtime/core/span.h +97 -0
- package/third-party/include/executorch/runtime/core/tag.h +90 -0
- package/third-party/include/executorch/runtime/core/tensor_layout.h +79 -0
- package/third-party/include/executorch/runtime/core/tensor_shape_dynamism.h +39 -0
- package/third-party/include/executorch/runtime/executor/memory_manager.h +113 -0
- package/third-party/include/executorch/runtime/executor/merged_data_map.h +142 -0
- package/third-party/include/executorch/runtime/executor/method.h +412 -0
- package/third-party/include/executorch/runtime/executor/method_meta.h +298 -0
- package/third-party/include/executorch/runtime/executor/program.h +309 -0
- package/third-party/include/executorch/runtime/executor/pte_data_map.h +145 -0
- package/third-party/include/executorch/runtime/executor/tensor_parser.h +157 -0
- package/third-party/include/executorch/runtime/kernel/kernel_runtime_context.h +122 -0
- package/third-party/include/executorch/runtime/kernel/operator_registry.h +280 -0
- package/third-party/include/executorch/runtime/platform/abort.h +36 -0
- package/third-party/include/executorch/runtime/platform/assert.h +119 -0
- package/third-party/include/executorch/runtime/platform/clock.h +43 -0
- package/third-party/include/executorch/runtime/platform/compat_unistd.h +75 -0
- package/third-party/include/executorch/runtime/platform/compiler.h +201 -0
- package/third-party/include/executorch/runtime/platform/log.h +177 -0
- package/third-party/include/executorch/runtime/platform/platform.h +259 -0
- package/third-party/include/executorch/runtime/platform/profiler.h +292 -0
- package/third-party/include/executorch/runtime/platform/runtime.h +35 -0
- package/third-party/include/executorch/runtime/platform/system.h +49 -0
- package/third-party/include/executorch/runtime/platform/types.h +24 -0
- package/third-party/include/executorch/schema/extended_header.h +85 -0
- package/third-party/include/headeronly/macros/Export.h +88 -0
- package/third-party/include/opencv2/core/affine.hpp +676 -0
- package/third-party/include/opencv2/core/async.hpp +107 -0
- package/third-party/include/opencv2/core/base.hpp +735 -0
- package/third-party/include/opencv2/core/bindings_utils.hpp +279 -0
- package/third-party/include/opencv2/core/bufferpool.hpp +39 -0
- package/third-party/include/opencv2/core/check.hpp +231 -0
- package/third-party/include/opencv2/core/core.hpp +55 -0
- package/third-party/include/opencv2/core/core_c.h +3261 -0
- package/third-party/include/opencv2/core/cv_cpu_dispatch.h +404 -0
- package/third-party/include/opencv2/core/cv_cpu_helper.h +856 -0
- package/third-party/include/opencv2/core/cvdef.h +1003 -0
- package/third-party/include/opencv2/core/cvstd.hpp +196 -0
- package/third-party/include/opencv2/core/cvstd.inl.hpp +188 -0
- package/third-party/include/opencv2/core/cvstd_wrapper.hpp +187 -0
- package/third-party/include/opencv2/core/detail/async_promise.hpp +73 -0
- package/third-party/include/opencv2/core/detail/dispatch_helper.impl.hpp +48 -0
- package/third-party/include/opencv2/core/detail/exception_ptr.hpp +24 -0
- package/third-party/include/opencv2/core/dualquaternion.hpp +1054 -0
- package/third-party/include/opencv2/core/dualquaternion.inl.hpp +464 -0
- package/third-party/include/opencv2/core/eigen.hpp +405 -0
- package/third-party/include/opencv2/core/fast_math.hpp +433 -0
- package/third-party/include/opencv2/core/hal/hal.hpp +451 -0
- package/third-party/include/opencv2/core/hal/interface.h +191 -0
- package/third-party/include/opencv2/core/hal/intrin.hpp +1222 -0
- package/third-party/include/opencv2/core/hal/intrin_avx.hpp +3378 -0
- package/third-party/include/opencv2/core/hal/intrin_avx512.hpp +3688 -0
- package/third-party/include/opencv2/core/hal/intrin_cpp.hpp +3446 -0
- package/third-party/include/opencv2/core/hal/intrin_forward.hpp +195 -0
- package/third-party/include/opencv2/core/hal/intrin_lasx.hpp +3243 -0
- package/third-party/include/opencv2/core/hal/intrin_lsx.hpp +2671 -0
- package/third-party/include/opencv2/core/hal/intrin_math.hpp +772 -0
- package/third-party/include/opencv2/core/hal/intrin_msa.hpp +1973 -0
- package/third-party/include/opencv2/core/hal/intrin_neon.hpp +2710 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv071.hpp +3452 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv_scalable.hpp +2559 -0
- package/third-party/include/opencv2/core/hal/intrin_sse.hpp +3528 -0
- package/third-party/include/opencv2/core/hal/intrin_sse_em.hpp +175 -0
- package/third-party/include/opencv2/core/hal/intrin_vsx.hpp +1756 -0
- package/third-party/include/opencv2/core/hal/intrin_wasm.hpp +2911 -0
- package/third-party/include/opencv2/core/hal/msa_macros.h +2079 -0
- package/third-party/include/opencv2/core/hal/simd_utils.impl.hpp +313 -0
- package/third-party/include/opencv2/core/mat.hpp +3842 -0
- package/third-party/include/opencv2/core/mat.inl.hpp +2753 -0
- package/third-party/include/opencv2/core/matx.hpp +603 -0
- package/third-party/include/opencv2/core/matx.inl.hpp +1132 -0
- package/third-party/include/opencv2/core/neon_utils.hpp +127 -0
- package/third-party/include/opencv2/core/operations.hpp +610 -0
- package/third-party/include/opencv2/core/optim.hpp +362 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.openmp.hpp +66 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.tbb.hpp +148 -0
- package/third-party/include/opencv2/core/parallel/parallel_backend.hpp +108 -0
- package/third-party/include/opencv2/core/persistence.hpp +1321 -0
- package/third-party/include/opencv2/core/quaternion.hpp +1889 -0
- package/third-party/include/opencv2/core/quaternion.inl.hpp +907 -0
- package/third-party/include/opencv2/core/saturate.hpp +347 -0
- package/third-party/include/opencv2/core/simd_intrinsics.hpp +90 -0
- package/third-party/include/opencv2/core/softfloat.hpp +657 -0
- package/third-party/include/opencv2/core/sse_utils.hpp +861 -0
- package/third-party/include/opencv2/core/traits.hpp +417 -0
- package/third-party/include/opencv2/core/types.hpp +2368 -0
- package/third-party/include/opencv2/core/types_c.h +2064 -0
- package/third-party/include/opencv2/core/utility.hpp +1296 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.hpp +31 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.impl.hpp +111 -0
- package/third-party/include/opencv2/core/utils/filesystem.hpp +91 -0
- package/third-party/include/opencv2/core/utils/fp_control_utils.hpp +70 -0
- package/third-party/include/opencv2/core/utils/instrumentation.hpp +127 -0
- package/third-party/include/opencv2/core/utils/logger.defines.hpp +50 -0
- package/third-party/include/opencv2/core/utils/logger.hpp +258 -0
- package/third-party/include/opencv2/core/utils/logtag.hpp +27 -0
- package/third-party/include/opencv2/core/utils/tls.hpp +230 -0
- package/third-party/include/opencv2/core/utils/trace.hpp +281 -0
- package/third-party/include/opencv2/core/version.hpp +29 -0
- package/third-party/include/opencv2/core/vsx_utils.hpp +1115 -0
- package/third-party/include/opencv2/core.hpp +3699 -0
- package/third-party/include/opencv2/cvconfig.h +155 -0
- package/third-party/include/opencv2/dnn/dnn.hpp +51 -0
- package/third-party/include/opencv2/dnn.hpp +17 -0
- package/third-party/include/opencv2/features2d/features2d.hpp +55 -0
- package/third-party/include/opencv2/features2d/hal/interface.h +32 -0
- package/third-party/include/opencv2/features2d.hpp +1756 -0
- package/third-party/include/opencv2/highgui/highgui.hpp +113 -0
- package/third-party/include/opencv2/highgui.hpp +17 -0
- package/third-party/include/opencv2/imgproc/bindings.hpp +34 -0
- package/third-party/include/opencv2/imgproc/detail/gcgraph.hpp +355 -0
- package/third-party/include/opencv2/imgproc/detail/legacy.hpp +35 -0
- package/third-party/include/opencv2/imgproc/hal/hal.hpp +246 -0
- package/third-party/include/opencv2/imgproc/hal/interface.h +52 -0
- package/third-party/include/opencv2/imgproc/imgproc.hpp +55 -0
- package/third-party/include/opencv2/imgproc/imgproc_c.h +1261 -0
- package/third-party/include/opencv2/imgproc/segmentation.hpp +168 -0
- package/third-party/include/opencv2/imgproc/types_c.h +632 -0
- package/third-party/include/opencv2/imgproc.hpp +5956 -0
- package/third-party/include/opencv2/opencv.hpp +102 -0
- package/third-party/include/opencv2/opencv_modules.hpp +19 -0
- package/third-party/include/opencv2/photo/legacy/constants_c.h +10 -0
- package/third-party/include/opencv2/photo/photo.hpp +55 -0
- package/third-party/include/opencv2/photo.hpp +975 -0
- package/third-party/include/opencv2/video/background_segm.hpp +341 -0
- package/third-party/include/opencv2/video/detail/tracking.detail.hpp +435 -0
- package/third-party/include/opencv2/video/legacy/constants_c.h +15 -0
- package/third-party/include/opencv2/video/tracking.hpp +1014 -0
- package/third-party/include/opencv2/video/video.hpp +55 -0
- package/third-party/include/opencv2/video.hpp +65 -0
- package/third-party/include/pthreadpool/pthreadpool.h +2236 -0
- package/third-party/include/tokenizers-cpp/tokenizers_c.h +61 -0
- package/third-party/include/tokenizers-cpp/tokenizers_cpp.h +118 -0
- package/third-party/include/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/libs/cpuinfo/libcpuinfo.a +0 -0
- package/third-party/ios/libs/pthreadpool/physical-arm64-release/libpthreadpool.a +0 -0
- package/third-party/ios/libs/pthreadpool/simulator-arm64-debug/libpthreadpool.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libsentencepiece.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib → third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_c.a} +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_cpp.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libsentencepiece.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_c.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_cpp.a +0 -0
- package/LICENSE +0 -79
- package/android/src/main/java/com/swmansion/rnexecutorch/Classification.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/ETModule.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ImageSegmentation.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/LLM.kt +0 -63
- package/android/src/main/java/com/swmansion/rnexecutorch/OCR.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ObjectDetection.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/SpeechToText.kt +0 -91
- package/android/src/main/java/com/swmansion/rnexecutorch/StyleTransfer.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/TextEmbeddings.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/Tokenizer.kt +0 -86
- package/android/src/main/java/com/swmansion/rnexecutorch/VerticalOCR.kt +0 -179
- package/android/src/main/java/com/swmansion/rnexecutorch/models/BaseModel.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsModel.kt +0 -48
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsUtils.kt +0 -37
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/ClassificationModel.kt +0 -46
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/Constants.kt +0 -1005
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/Constants.kt +0 -26
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/ImageSegmentationModel.kt +0 -142
- package/android/src/main/java/com/swmansion/rnexecutorch/models/objectDetection/SSDLiteLargeModel.kt +0 -74
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Detector.kt +0 -82
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/RecognitionHandler.kt +0 -117
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Recognizer.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/VerticalDetector.kt +0 -89
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/CTCLabelConverter.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/Constants.kt +0 -31
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/DetectorUtils.kt +0 -608
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/RecognizerUtils.kt +0 -430
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TDecoder.kt +0 -39
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TModule.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Moonshine.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineDecoder.kt +0 -23
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineEncoder.kt +0 -20
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Whisper.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperDecoder.kt +0 -22
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperEncoder.kt +0 -29
- package/android/src/main/java/com/swmansion/rnexecutorch/models/styleTransfer/StyleTransferModel.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ArrayUtils.kt +0 -87
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ETError.kt +0 -34
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ImageProcessor.kt +0 -237
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/Numerical.kt +0 -8
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ObjectDetectionUtils.kt +0 -201
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/STFT.kt +0 -50
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/TensorUtils.kt +0 -103
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/RnExecutorch/Classification.h +0 -5
- package/ios/RnExecutorch/Classification.mm +0 -54
- package/ios/RnExecutorch/ETModule.h +0 -5
- package/ios/RnExecutorch/ETModule.mm +0 -75
- package/ios/RnExecutorch/ImageSegmentation.h +0 -5
- package/ios/RnExecutorch/ImageSegmentation.mm +0 -60
- package/ios/RnExecutorch/LLM.h +0 -5
- package/ios/RnExecutorch/LLM.mm +0 -78
- package/ios/RnExecutorch/OCR.h +0 -5
- package/ios/RnExecutorch/OCR.mm +0 -96
- package/ios/RnExecutorch/ObjectDetection.h +0 -5
- package/ios/RnExecutorch/ObjectDetection.mm +0 -56
- package/ios/RnExecutorch/SpeechToText.h +0 -5
- package/ios/RnExecutorch/SpeechToText.mm +0 -125
- package/ios/RnExecutorch/StyleTransfer.h +0 -5
- package/ios/RnExecutorch/StyleTransfer.mm +0 -55
- package/ios/RnExecutorch/TextEmbeddings.h +0 -5
- package/ios/RnExecutorch/TextEmbeddings.mm +0 -62
- package/ios/RnExecutorch/Tokenizer.h +0 -5
- package/ios/RnExecutorch/Tokenizer.mm +0 -83
- package/ios/RnExecutorch/VerticalOCR.h +0 -5
- package/ios/RnExecutorch/VerticalOCR.mm +0 -183
- package/ios/RnExecutorch/models/BaseModel.h +0 -21
- package/ios/RnExecutorch/models/BaseModel.mm +0 -43
- package/ios/RnExecutorch/models/classification/ClassificationModel.h +0 -10
- package/ios/RnExecutorch/models/classification/ClassificationModel.mm +0 -53
- package/ios/RnExecutorch/models/classification/Constants.h +0 -3
- package/ios/RnExecutorch/models/image_segmentation/Constants.h +0 -4
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.h +0 -10
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.mm +0 -146
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.hpp +0 -11
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.mm +0 -64
- package/ios/RnExecutorch/models/ocr/Detector.h +0 -9
- package/ios/RnExecutorch/models/ocr/Detector.mm +0 -101
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.h +0 -16
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.mm +0 -135
- package/ios/RnExecutorch/models/ocr/Recognizer.h +0 -8
- package/ios/RnExecutorch/models/ocr/Recognizer.mm +0 -77
- package/ios/RnExecutorch/models/ocr/VerticalDetector.h +0 -10
- package/ios/RnExecutorch/models/ocr/VerticalDetector.mm +0 -118
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.h +0 -16
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.mm +0 -80
- package/ios/RnExecutorch/models/ocr/utils/Constants.h +0 -26
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.h +0 -31
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.mm +0 -754
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.h +0 -10
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.mm +0 -67
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.h +0 -35
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.mm +0 -331
- package/ios/RnExecutorch/models/stt/Moonshine.hpp +0 -13
- package/ios/RnExecutorch/models/stt/Moonshine.mm +0 -64
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.mm +0 -24
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.mm +0 -18
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.hpp +0 -26
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.mm +0 -19
- package/ios/RnExecutorch/models/stt/Whisper.hpp +0 -12
- package/ios/RnExecutorch/models/stt/Whisper.mm +0 -68
- package/ios/RnExecutorch/models/stt/WhisperDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/WhisperDecoder.mm +0 -22
- package/ios/RnExecutorch/models/stt/WhisperEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/WhisperEncoder.mm +0 -21
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.h +0 -11
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.mm +0 -50
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.h +0 -15
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.mm +0 -45
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.h +0 -8
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.mm +0 -49
- package/ios/RnExecutorch/utils/Constants.h +0 -8
- package/ios/RnExecutorch/utils/Conversions.h +0 -15
- package/ios/RnExecutorch/utils/ETError.h +0 -26
- package/ios/RnExecutorch/utils/ImageProcessor.h +0 -15
- package/ios/RnExecutorch/utils/ImageProcessor.mm +0 -147
- package/ios/RnExecutorch/utils/Numerical.h +0 -1
- package/ios/RnExecutorch/utils/Numerical.mm +0 -18
- package/ios/RnExecutorch/utils/ObjectDetectionUtils.hpp +0 -23
- package/ios/RnExecutorch/utils/SFFT.hpp +0 -13
- package/ios/RnExecutorch/utils/SFFT.mm +0 -71
- package/ios/RnExecutorch/utils/ScalarType.h +0 -14
- package/ios/RnExecutorch/utils/ScalarType.mm +0 -21
- package/lib/module/constants/sttDefaults.js +0 -72
- package/lib/module/constants/sttDefaults.js.map +0 -1
- package/lib/module/controllers/SpeechToTextController.js +0 -307
- package/lib/module/controllers/SpeechToTextController.js.map +0 -1
- package/lib/module/native/NativeClassification.js +0 -5
- package/lib/module/native/NativeClassification.js.map +0 -1
- package/lib/module/native/NativeETModule.js +0 -5
- package/lib/module/native/NativeETModule.js.map +0 -1
- package/lib/module/native/NativeImageSegmentation.js +0 -5
- package/lib/module/native/NativeImageSegmentation.js.map +0 -1
- package/lib/module/native/NativeLLM.js +0 -5
- package/lib/module/native/NativeLLM.js.map +0 -1
- package/lib/module/native/NativeOCR.js +0 -5
- package/lib/module/native/NativeOCR.js.map +0 -1
- package/lib/module/native/NativeObjectDetection.js +0 -5
- package/lib/module/native/NativeObjectDetection.js.map +0 -1
- package/lib/module/native/NativeSpeechToText.js +0 -5
- package/lib/module/native/NativeSpeechToText.js.map +0 -1
- package/lib/module/native/NativeStyleTransfer.js +0 -5
- package/lib/module/native/NativeStyleTransfer.js.map +0 -1
- package/lib/module/native/NativeTextEmbeddings.js +0 -5
- package/lib/module/native/NativeTextEmbeddings.js.map +0 -1
- package/lib/module/native/NativeTokenizer.js +0 -5
- package/lib/module/native/NativeTokenizer.js.map +0 -1
- package/lib/module/native/NativeVerticalOCR.js +0 -5
- package/lib/module/native/NativeVerticalOCR.js.map +0 -1
- package/lib/module/package.json +0 -1
- package/lib/module/utils/stt.js +0 -22
- package/lib/module/utils/stt.js.map +0 -1
- package/lib/typescript/constants/sttDefaults.d.ts +0 -28
- package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
- package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -52
- package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
- package/lib/typescript/native/NativeClassification.d.ts +0 -10
- package/lib/typescript/native/NativeClassification.d.ts.map +0 -1
- package/lib/typescript/native/NativeETModule.d.ts +0 -9
- package/lib/typescript/native/NativeETModule.d.ts.map +0 -1
- package/lib/typescript/native/NativeImageSegmentation.d.ts +0 -10
- package/lib/typescript/native/NativeImageSegmentation.d.ts.map +0 -1
- package/lib/typescript/native/NativeLLM.d.ts +0 -12
- package/lib/typescript/native/NativeLLM.d.ts.map +0 -1
- package/lib/typescript/native/NativeOCR.d.ts +0 -9
- package/lib/typescript/native/NativeOCR.d.ts.map +0 -1
- package/lib/typescript/native/NativeObjectDetection.d.ts +0 -9
- package/lib/typescript/native/NativeObjectDetection.d.ts.map +0 -1
- package/lib/typescript/native/NativeSpeechToText.d.ts +0 -12
- package/lib/typescript/native/NativeSpeechToText.d.ts.map +0 -1
- package/lib/typescript/native/NativeStyleTransfer.d.ts.map +0 -1
- package/lib/typescript/native/NativeTextEmbeddings.d.ts +0 -8
- package/lib/typescript/native/NativeTextEmbeddings.d.ts.map +0 -1
- package/lib/typescript/native/NativeTokenizer.d.ts +0 -12
- package/lib/typescript/native/NativeTokenizer.d.ts.map +0 -1
- package/lib/typescript/native/NativeVerticalOCR.d.ts +0 -9
- package/lib/typescript/native/NativeVerticalOCR.d.ts.map +0 -1
- package/lib/typescript/utils/stt.d.ts +0 -2
- package/lib/typescript/utils/stt.d.ts.map +0 -1
- package/src/constants/sttDefaults.ts +0 -86
- package/src/controllers/SpeechToTextController.ts +0 -458
- package/src/index.tsx +0 -47
- package/src/native/NativeClassification.ts +0 -9
- package/src/native/NativeETModule.ts +0 -14
- package/src/native/NativeImageSegmentation.ts +0 -14
- package/src/native/NativeLLM.ts +0 -14
- package/src/native/NativeOCR.ts +0 -16
- package/src/native/NativeObjectDetection.ts +0 -10
- package/src/native/NativeSpeechToText.ts +0 -17
- package/src/native/NativeStyleTransfer.ts +0 -10
- package/src/native/NativeTextEmbeddings.ts +0 -9
- package/src/native/NativeTokenizer.ts +0 -13
- package/src/native/NativeVerticalOCR.ts +0 -16
- package/src/utils/stt.ts +0 -28
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/Info.plist +4 -4
|
@@ -1,53 +0,0 @@
|
|
|
1
|
-
#import "ClassificationModel.h"
|
|
2
|
-
#import "../../utils/ImageProcessor.h"
|
|
3
|
-
#import "../../utils/Numerical.h"
|
|
4
|
-
#import "Constants.h"
|
|
5
|
-
|
|
6
|
-
@implementation ClassificationModel

/// Returns the image size expected by the model, derived from the shape of
/// input tensor 0: the last entry is read as the width and the second-to-last
/// entry as the height.
- (cv::Size)getModelImageSize {
  // Boxed index, as used by the other getInputShape: call site in this
  // project; a bare 0 would be passed as nil if the parameter is an object
  // pointer. NOTE(review): confirm against the ETModel header.
  NSArray *inputShape = [module getInputShape:@0];

  // `count - 2` is unsigned arithmetic and would wrap around for a shape with
  // fewer than two dimensions, so fail loudly with a readable message instead.
  NSAssert(inputShape.count >= 2,
           @"Expected an input shape with at least 2 dimensions, got %lu",
           (unsigned long)inputShape.count);

  NSNumber *widthNumber = inputShape.lastObject;
  NSNumber *heightNumber = inputShape[inputShape.count - 2];

  int height = [heightNumber intValue];
  int width = [widthNumber intValue];

  // cv::Size is constructed as (width, height); the previous
  // cv::Size(height, width) transposed the dimensions for non-square inputs.
  return cv::Size(width, height);
}

/// Resizes `input` to the model's image size and converts it to an NSArray
/// via +[ImageProcessor matToNSArray:].
///
/// Note that `input` is taken by reference and resized in place, so the
/// caller's matrix is modified.
- (NSArray *)preprocess:(cv::Mat &)input {
  cv::Size modelImageSize = [self getModelImageSize];
  cv::resize(input, input, modelImageSize);

  return [ImageProcessor matToNSArray:input];
}

/// Converts the raw model output into a dictionary mapping class label to
/// probability.
///
/// Only the first output tensor (`output[0]`) is used. Its values are passed
/// through softmax() and each resulting probability is stored under the label
/// at the same index in `imagenet1k_v1_labels`.
- (NSDictionary *)postprocess:(NSArray *)output {
  NSArray *scores = output[0]; // take the first output tensor

  std::vector<double> scoreVector;
  scoreVector.reserve(scores.count);
  for (NSNumber *score in scores) {
    scoreVector.push_back([score doubleValue]);
  }

  std::vector<double> probabilities = softmax(scoreVector);
  NSMutableDictionary *result =
      [NSMutableDictionary dictionaryWithCapacity:probabilities.size()];

  // NOTE(review): assumes the model emits no more scores than there are
  // entries in imagenet1k_v1_labels; the label table is indexed unchecked.
  for (std::size_t i = 0; i < probabilities.size(); ++i) {
    NSString *className = @(imagenet1k_v1_labels[i].c_str());
    result[className] = @(probabilities[i]);
  }

  return result;
}

/// Runs the full pipeline on `input`: preprocess, forward pass with the
/// preprocessed data as the single model input, then postprocess.
- (NSDictionary *)runModel:(cv::Mat &)input {
  NSArray *modelInput = [self preprocess:input];
  NSArray *modelOutput = [self forward:@[ modelInput ]];
  return [self postprocess:modelOutput];
}

@end
|
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
#import "../BaseModel.h"
|
|
2
|
-
#import "opencv2/opencv.hpp"
|
|
3
|
-
|
|
4
|
-
/// Segmentation model wrapper built on top of BaseModel.
@interface ImageSegmentationModel : BaseModel

/// Spatial size of the image the model takes as input.
- (cv::Size)getModelImageSize;

/// Runs the model on `input`.
/// @param input Image to segment.
/// @param classesOfInterest Label names whose per-pixel score maps should be
///        included in the result.
/// @param resize When YES, results are scaled back to the size of `input`;
///        otherwise they stay at model resolution.
/// @return Dictionary of the requested label maps plus an "ARGMAX" entry.
- (NSDictionary *)runModel:(cv::Mat &)input
             returnClasses:(NSArray *)classesOfInterest
                    resize:(BOOL)resize;

@end
|
|
@@ -1,146 +0,0 @@
|
|
|
1
|
-
#import "ImageSegmentationModel.h"
|
|
2
|
-
#import "../../utils/Conversions.h"
|
|
3
|
-
#import "../../utils/ImageProcessor.h"
|
|
4
|
-
#import "../../utils/Numerical.h"
|
|
5
|
-
#import "Constants.h"
|
|
6
|
-
#import <unordered_set>
|
|
7
|
-
|
|
8
|
-
// Private pipeline stages; only -runModel:returnClasses:resize: is public.
@interface ImageSegmentationModel ()

/// Converts the input image into the model's input representation.
- (NSArray *)preprocess:(cv::Mat &)input;

/// Turns the raw model output into the result dictionary.
- (NSDictionary *)postprocess:(NSArray *)output
                returnClasses:(NSArray *)classesOfInterest
                       resize:(BOOL)resize;

@end
|
|
14
|
-
|
|
15
|
-
/// Segmentation pipeline: resize -> forward -> per-pixel softmax/argmax over
/// the `deeplabv3_resnet50_labels` classes.
@implementation ImageSegmentationModel {
  // Size (cols x rows) of the most recently preprocessed image; written by
  // -preprocess: and read by -postprocess:returnClasses:resize:.
  cv::Size originalSize;
}

/// Returns the spatial size expected by the model, taken from the last two
/// entries of input tensor 0 (second-to-last is treated as height, last as
/// width).
- (cv::Size)getModelImageSize {
  NSArray *inputShape = [module getInputShape:@0];
  NSNumber *widthNumber = inputShape.lastObject;
  NSNumber *heightNumber = inputShape[inputShape.count - 2];

  int height = [heightNumber intValue];
  int width = [widthNumber intValue];

  // cv::Size is constructed as (width, height). With the arguments swapped,
  // the matrices built in extractResults get rows/cols transposed relative to
  // the `pixel / width` indexing whenever the model input is not square.
  return cv::Size(width, height);
}

/// Remembers the original image size and returns the image resized to model
/// resolution, converted to ImageProcessor's NSArray representation.
- (NSArray *)preprocess:(cv::Mat &)input {
  originalSize = cv::Size(input.cols, input.rows);

  cv::Size modelImageSize = [self getModelImageSize];
  cv::Mat output;
  cv::resize(input, output, modelImageSize);

  NSArray *modelInput = [ImageProcessor matToNSArray:output];
  return modelInput;
}

/// Splits the flat model output into one CV_64F score matrix per label.
/// `result` is read as `numLabels` consecutive planes of
/// `modelImageSize.height * modelImageSize.width` values, row-major.
/// When `resize` is set, each plane is scaled to `originalSize`.
std::vector<cv::Mat> extractResults(NSArray *result, std::size_t numLabels,
                                    cv::Size modelImageSize,
                                    cv::Size originalSize, BOOL resize) {
  std::size_t numModelPixels = static_cast<std::size_t>(modelImageSize.height) *
                               static_cast<std::size_t>(modelImageSize.width);

  std::vector<cv::Mat> resizedLabelScores(numLabels);
  for (std::size_t label = 0; label < numLabels; ++label) {
    cv::Mat labelMat = cv::Mat(modelImageSize, CV_64F);

    for (std::size_t pixel = 0; pixel < numModelPixels; ++pixel) {
      int row = pixel / modelImageSize.width;
      int col = pixel % modelImageSize.width;
      labelMat.at<double>(row, col) =
          [result[label * numModelPixels + pixel] doubleValue];
    }

    if (resize) {
      cv::resize(labelMat, resizedLabelScores[label], originalSize);
    } else {
      resizedLabelScores[label] = std::move(labelMat);
    }
  }
  return resizedLabelScores;
}

/// For every pixel: replaces the raw per-label scores in `labelScores` with
/// their softmax and writes the index of the highest raw score into `argMax`
/// (CV_32S).
void adjustScoresPerPixel(std::vector<cv::Mat> &labelScores, cv::Mat &argMax,
                          cv::Size outputSize, std::size_t numLabels) {
  std::size_t numOutputPixels = static_cast<std::size_t>(outputSize.height) *
                                static_cast<std::size_t>(outputSize.width);

  // Reused across pixels to avoid one heap allocation per pixel.
  std::vector<double> scores;
  scores.reserve(numLabels);

  for (std::size_t pixel = 0; pixel < numOutputPixels; ++pixel) {
    int row = pixel / outputSize.width;
    int col = pixel % outputSize.width;

    scores.clear();
    for (const auto &mat : labelScores) {
      scores.push_back(mat.at<double>(row, col));
    }

    std::vector<double> adjustedScores = softmax(scores);

    for (std::size_t label = 0; label < numLabels; ++label) {
      labelScores[label].at<double>(row, col) = adjustedScores[label];
    }

    auto maxIt = std::max_element(scores.begin(), scores.end());
    argMax.at<int>(row, col) =
        static_cast<int>(std::distance(scores.begin(), maxIt));
  }
}

/// Builds the result dictionary from the flat output tensor.
/// @param output Flat array of scores for all labels and pixels.
/// @param classesOfInterest Label names (NSString) to include in the result.
/// @param resize Whether maps are scaled to the original image size.
/// @return Requested label maps plus the "ARGMAX" map.
- (NSDictionary *)postprocess:(NSArray *)output
                returnClasses:(NSArray *)classesOfInterest
                       resize:(BOOL)resize {
  cv::Size modelImageSize = [self getModelImageSize];

  std::size_t numLabels = deeplabv3_resnet50_labels.size();

  NSAssert((std::size_t)output.count ==
               numLabels * modelImageSize.height * modelImageSize.width,
           @"Model generated unexpected output size.");

  // For each label extract its matrix,
  // and rescale it to the original size if `resize`
  std::vector<cv::Mat> resizedLabelScores =
      extractResults(output, numLabels, modelImageSize, originalSize, resize);

  cv::Size outputSize = resize ? originalSize : modelImageSize;
  cv::Mat argMax = cv::Mat(outputSize, CV_32S);

  // For each pixel apply softmax across all the labels and calculate the argMax
  adjustScoresPerPixel(resizedLabelScores, argMax, outputSize, numLabels);

  std::unordered_set<std::string> labelSet;

  for (id label in classesOfInterest) {
    labelSet.insert(std::string([label UTF8String]));
  }

  NSMutableDictionary *result = [NSMutableDictionary dictionary];

  // Convert to NSArray and populate the final dictionary
  for (std::size_t label = 0; label < numLabels; ++label) {
    if (labelSet.contains(deeplabv3_resnet50_labels[label])) {
      NSString *labelString = @(deeplabv3_resnet50_labels[label].c_str());
      NSArray *arr = simpleMatToNSArray<double>(resizedLabelScores[label]);
      result[labelString] = arr;
    }
  }

  result[@"ARGMAX"] = simpleMatToNSArray<int>(argMax);

  return result;
}

/// Full pipeline: preprocess -> forward -> postprocess on the first output
/// tensor.
- (NSDictionary *)runModel:(cv::Mat &)input
             returnClasses:(NSArray *)classesOfInterest
                    resize:(BOOL)resize {
  NSArray *modelInput = [self preprocess:input];
  NSArray *result = [self forward:@[ modelInput ]];

  NSDictionary *output = [self postprocess:result[0]
                             returnClasses:classesOfInterest
                                    resize:resize];

  return output;
}

@end
|
|
@@ -1,11 +0,0 @@
|
|
|
1
|
-
#import "../BaseModel.h"
|
|
2
|
-
#import <UIKit/UIKit.h>
|
|
3
|
-
#include <opencv2/opencv.hpp>
|
|
4
|
-
|
|
5
|
-
/// Object-detection model wrapper built on top of BaseModel.
@interface SSDLiteLargeModel : BaseModel

/// Runs detection on `input` and returns the resulting detections.
- (NSArray *)runModel:(cv::Mat)input;

/// Converts `input` into the model's input representation.
- (NSArray *)preprocess:(cv::Mat)input;

/// Converts raw model output into detections.
/// NOTE(review): the implementation shipped next to this header defines
/// -postprocess:widthRatio:heightRatio: — confirm that this one-argument
/// selector is actually implemented.
- (NSArray *)postprocess:(NSArray *)input;

@end
|
|
@@ -1,64 +0,0 @@
|
|
|
1
|
-
#include "SSDLiteLargeModel.hpp"
|
|
2
|
-
#include "../../utils/ObjectDetectionUtils.hpp"
|
|
3
|
-
#include "ImageProcessor.h"
|
|
4
|
-
|
|
5
|
-
// IoU threshold handed to nms() when suppressing overlapping detections.
constexpr float iouThreshold = 0.55;
// Detections scoring below this value are dropped before NMS.
constexpr float detectionThreshold = 0.7;
// Fixed resolution the input image is resized to before inference.
constexpr int modelInputWidth = 320;
constexpr int modelInputHeight = 320;
|
|
9
|
-
|
|
10
|
-
/// SSDLite object detector: resize -> forward -> score filter -> NMS.
@implementation SSDLiteLargeModel

/// Resizes a private copy of `input` to the fixed model resolution and
/// converts it to ImageProcessor's NSArray representation.
- (NSArray *)preprocess:(cv::Mat)input {
  cv::resize(input, input, cv::Size(modelInputWidth, modelInputHeight));
  NSArray *modelInput = [ImageProcessor matToNSArray:input];
  return modelInput;
}

/// Converts raw model output into detections in original-image coordinates.
/// @param input Output tensors: [0] boxes (4 values per detection),
///        [1] scores, [2] labels.
/// @param widthRatio Factor applied to x coordinates.
/// @param heightRatio Factor applied to y coordinates.
/// @return Array of dictionaries built by detectionToNSDictionary, after NMS.
- (NSArray *)postprocess:(NSArray *)input
              widthRatio:(float)widthRatio
             heightRatio:(float)heightRatio {
  NSArray *bboxes = [input objectAtIndex:0];
  NSArray *scores = [input objectAtIndex:1];
  NSArray *labels = [input objectAtIndex:2];

  std::vector<Detection> detections;

  for (NSUInteger idx = 0; idx < scores.count; idx++) {
    float score = [scores[idx] floatValue];
    float label = [labels[idx] floatValue];
    if (score < detectionThreshold) {
      continue;
    }
    float x1 = [bboxes[idx * 4] floatValue] * widthRatio;
    float y1 = [bboxes[idx * 4 + 1] floatValue] * heightRatio;
    float x2 = [bboxes[idx * 4 + 2] floatValue] * widthRatio;
    float y2 = [bboxes[idx * 4 + 3] floatValue] * heightRatio;

    Detection det = {x1, y1, x2, y2, label, score};
    detections.push_back(det);
  }
  std::vector<Detection> nms_output = nms(detections, iouThreshold);

  NSMutableArray *output = [NSMutableArray array];
  for (Detection &detection : nms_output) {
    [output addObject:detectionToNSDictionary(detection)];
  }

  return output;
}

/// One-argument variant declared in the public header. Without it, calling
/// the declared selector raises "unrecognized selector". Box coordinates are
/// left in model-input space (both ratios 1).
- (NSArray *)postprocess:(NSArray *)input {
  return [self postprocess:input widthRatio:1.0f heightRatio:1.0f];
}

/// Full pipeline; boxes are scaled back to the size of `input`.
- (NSArray *)runModel:(cv::Mat)input {
  cv::Size size = input.size();
  int inputImageWidth = size.width;
  int inputImageHeight = size.height;
  NSArray *modelInput = [self preprocess:input];
  NSArray *forwardResult = [self forward:@[ modelInput ]];
  NSArray *output =
      [self postprocess:forwardResult
             widthRatio:inputImageWidth / (float)modelInputWidth
            heightRatio:inputImageHeight / (float)modelInputHeight];
  return output;
}

@end
|
|
@@ -1,101 +0,0 @@
|
|
|
1
|
-
#import "Detector.h"
|
|
2
|
-
#import "../../utils/ImageProcessor.h"
|
|
3
|
-
#import "utils/Constants.h"
|
|
4
|
-
#import "utils/DetectorUtils.h"
|
|
5
|
-
#import "utils/OCRUtils.h"
|
|
6
|
-
|
|
7
|
-
/*
|
|
8
|
-
The model used as detector is based on CRAFT (Character Region Awareness for
|
|
9
|
-
Text Detection) paper. https://arxiv.org/pdf/1904.01941
|
|
10
|
-
*/
|
|
11
|
-
|
|
12
|
-
/// Text detector: pads/resizes the image, runs the model and turns the two
/// output heat maps into grouped text bounding boxes.
@implementation Detector {
  // Size of the last image passed to -preprocess:.
  cv::Size originalSize;
  // Lazily computed model input size; empty until first requested.
  cv::Size modelSize;
}

/// Returns the cached model input size, computing it on first use as
/// cv::Size(last dim, second-to-last dim) of input tensor 0.
- (cv::Size)getModelImageSize {
  if (modelSize.empty()) {
    NSArray *shape = [module getInputShape:@0];
    const int secondToLastDim = [shape[shape.count - 2] intValue];
    const int lastDim = [shape.lastObject intValue];
    modelSize = cv::Size(lastDim, secondToLastDim);
  }

  return modelSize;
}

/// Builds the model input from `input`.
- (NSArray *)preprocess:(cv::Mat &)input {
  /*
   The detector takes a tensor of shape [1, 3, 800, 800]. Plain resizing hurts
   recognition quality a lot, so the image keeps its original aspect ratio and
   the remaining area is filled with padding.
   */
  self->originalSize = cv::Size(input.cols, input.rows);
  const cv::Size targetSize = [self getModelImageSize];
  cv::Mat paddedImage = [OCRUtils resizeWithPadding:input
                                       desiredWidth:targetSize.width
                                      desiredHeight:targetSize.height];
  return [ImageProcessor matToNSArray:paddedImage mean:mean variance:variance];
}

/// Converts the model output into a list of text bounding boxes.
- (NSArray *)postprocess:(NSArray *)output {
  /*
   The model emits two heat maps:
   1. ScoreText (score map) - probability that a region contains a character
   2. ScoreAffinity (affinity map) - affinity between characters, used to
      group characters into a single instance (sequence)
   Both matrices are 400x400.

   This step returns the list of bounding boxes that contain text.
   */
  NSArray *interleavedMaps = [output objectAtIndex:0];

  const cv::Size inputSize = [self getModelImageSize];
  /*
   The two heat maps arrive interleaved in a single tensor and each one is
   half the size of the model input, hence the division by 2.
   */
  const cv::Size heatMapSize(inputSize.width / 2, inputSize.height / 2);
  cv::Mat scoreTextCV, scoreAffinityCV;
  [DetectorUtils interleavedArrayToMats:interleavedMaps
                             outputMat1:scoreTextCV
                             outputMat2:scoreAffinityCV
                               withSize:heatMapSize];

  NSArray *boxes = [DetectorUtils getDetBoxesFromTextMap:scoreTextCV
                                             affinityMap:scoreAffinityCV
                                      usingTextThreshold:textThreshold
                                           linkThreshold:linkThreshold
                                        lowTextThreshold:lowTextThreshold];
  boxes = [DetectorUtils restoreBboxRatio:boxes usingRestoreRatio:restoreRatio];

  return [DetectorUtils groupTextBoxes:boxes
                       centerThreshold:centerThreshold
                     distanceThreshold:distanceThreshold
                       heightThreshold:heightThreshold
                      minSideThreshold:minSideThreshold
                      maxSideThreshold:maxSideThreshold
                              maxWidth:maxWidth];
}

/// Full pipeline: preprocess -> forward -> postprocess.
- (NSArray *)runModel:(cv::Mat &)input {
  NSArray *tensor = [self preprocess:input];
  NSArray *rawOutput = [self forward:@[ tensor ]];
  return [self postprocess:rawOutput];
}

@end
|
|
@@ -1,16 +0,0 @@
|
|
|
1
|
-
#import "opencv2/opencv.hpp"
|
|
2
|
-
|
|
3
|
-
/// Owns the recognizer models and converts their output to text.
@interface RecognitionHandler : NSObject

/// @param symbols Character set handed to the CTC label converter.
- (instancetype)initWithSymbols:(NSString *)symbols;

/// Loads the three recognizer models.
/// @return The first non-zero error code reported by a model, or 0.
- (NSNumber *)loadRecognizers:(NSString *)largeRecognizerPath
         mediumRecognizerPath:(NSString *)mediumRecognizerPath
          smallRecognizerPath:(NSString *)smallRecognizerPath;

/// Recognizes the text inside each box of `bBoxesList`.
/// @param bBoxesList Boxes to read; each entry carries a "bbox" value.
/// @param imgGray Image the boxes refer to.
/// @param desiredWidth Width the image is padded/resized to before cropping.
/// @param desiredHeight Height the image is padded/resized to before cropping.
/// @return Array of dictionaries with "text", "bbox" and "score" keys.
- (NSArray *)recognize:(NSArray<NSDictionary *> *)bBoxesList
               imgGray:(cv::Mat)imgGray
          desiredWidth:(int)desiredWidth
         desiredHeight:(int)desiredHeight;

@end
|
|
@@ -1,135 +0,0 @@
|
|
|
1
|
-
#import "RecognitionHandler.h"
|
|
2
|
-
#import "./utils/CTCLabelConverter.h"
|
|
3
|
-
#import "./utils/Constants.h"
|
|
4
|
-
#import "./utils/OCRUtils.h"
|
|
5
|
-
#import "./utils/RecognizerUtils.h"
|
|
6
|
-
#import "Recognizer.h"
|
|
7
|
-
|
|
8
|
-
/*
|
|
9
|
-
RecognitionHandler class is responsible for loading and choosing the
|
|
10
|
-
appropriate recognizer model based on the input image size, it also handles
|
|
11
|
-
converting the model output to text.
|
|
12
|
-
*/
|
|
13
|
-
|
|
14
|
-
/// Loads the three recognizer models, picks one per crop based on crop width
/// and decodes the model output into text.
@implementation RecognitionHandler {
  Recognizer *recognizerLarge;
  Recognizer *recognizerMedium;
  Recognizer *recognizerSmall;
  CTCLabelConverter *converter;
}

/// Creates the (not yet loaded) recognizers and the label converter for
/// `symbols`.
- (instancetype)initWithSymbols:(NSString *)symbols {
  self = [super init];
  if (self) {
    recognizerLarge = [[Recognizer alloc] init];
    recognizerMedium = [[Recognizer alloc] init];
    recognizerSmall = [[Recognizer alloc] init];

    converter = [[CTCLabelConverter alloc] initWithCharacters:symbols
                                                separatorList:@{}];
  }
  return self;
}

/// Loads the large, medium and small models in that order.
/// @return The first non-zero error code returned by -loadModel:, or @0 when
///         all three loaded.
- (NSNumber *)loadRecognizers:(NSString *)largeRecognizerPath
         mediumRecognizerPath:(NSString *)mediumRecognizerPath
          smallRecognizerPath:(NSString *)smallRecognizerPath {
  NSArray<Recognizer *> *recognizers =
      @[ recognizerLarge, recognizerMedium, recognizerSmall ];

  NSArray<NSString *> *paths =
      @[ largeRecognizerPath, mediumRecognizerPath, smallRecognizerPath ];

  for (NSUInteger i = 0; i < recognizers.count; i++) {
    Recognizer *recognizer = recognizers[i];
    NSString *path = paths[i];

    NSNumber *errorCode = [recognizer loadModel:path];
    if ([errorCode intValue] != 0) {
      return errorCode;
    }
  }

  return @0;
}

/// Dispatches `croppedImage` to the recognizer matching its width.
- (NSArray *)runModel:(cv::Mat)croppedImage {
  NSArray *result;
  if (croppedImage.cols >= largeRecognizerWidth) {
    result = [recognizerLarge runModel:croppedImage];
  } else if (croppedImage.cols >= mediumRecognizerWidth) {
    result = [recognizerMedium runModel:croppedImage];
  } else {
    result = [recognizerSmall runModel:croppedImage];
  }

  return result;
}

/// Reads the text inside every box of `bBoxesList`.
/// Boxes whose crop is empty, or for which the recognizer/decoder returns no
/// usable result, are skipped.
/// @return Array of @{ @"text", @"bbox", @"score" } dictionaries; bbox points
///         are mapped back using the padding offsets and resize ratio.
- (NSArray *)recognize:(NSArray<NSDictionary *> *)bBoxesList
               imgGray:(cv::Mat)imgGray
          desiredWidth:(int)desiredWidth
         desiredHeight:(int)desiredHeight {
  NSDictionary *ratioAndPadding =
      [RecognizerUtils calculateResizeRatioAndPaddings:imgGray.cols
                                                height:imgGray.rows
                                          desiredWidth:desiredWidth
                                         desiredHeight:desiredHeight];
  const int left = [ratioAndPadding[@"left"] intValue];
  const int top = [ratioAndPadding[@"top"] intValue];
  const CGFloat resizeRatio = [ratioAndPadding[@"resizeRatio"] floatValue];
  imgGray = [OCRUtils resizeWithPadding:imgGray
                           desiredWidth:desiredWidth
                          desiredHeight:desiredHeight];

  NSMutableArray *predictions = [NSMutableArray array];
  for (NSDictionary *box in bBoxesList) {
    // Each iteration creates sizeable temporaries (model input/output
    // arrays); drain them per box instead of at the end of the whole loop.
    @autoreleasepool {
      cv::Mat croppedImage = [RecognizerUtils getCroppedImage:box
                                                        image:imgGray
                                                  modelHeight:recognizerHeight];
      if (croppedImage.empty()) {
        continue;
      }
      croppedImage = [RecognizerUtils normalizeForRecognizer:croppedImage
                                              adjustContrast:adjustContrast
                                                  isVertical:NO];
      NSArray *result = [self runModel:croppedImage];
      // Expected layout: [predicted indices, confidence score].
      if (result.count < 2) {
        continue;
      }

      NSNumber *confidenceScore = result[1];
      if ([confidenceScore floatValue] < lowConfidenceThreshold) {
        // Low confidence: retry with the crop turned upside down and keep
        // whichever reading scores higher.
        cv::rotate(croppedImage, croppedImage, cv::ROTATE_180);

        NSArray *rotatedResult = [self runModel:croppedImage];
        if (rotatedResult.count >= 2) {
          NSNumber *rotatedConfidenceScore = rotatedResult[1];

          if ([rotatedConfidenceScore floatValue] >
              [confidenceScore floatValue]) {
            result = rotatedResult;
            confidenceScore = rotatedConfidenceScore;
          }
        }
      }

      NSArray *predIndex = result[0];
      NSArray *decodedTexts = [converter decodeGreedy:predIndex
                                               length:(int)(predIndex.count)];
      if (decodedTexts.count == 0) {
        continue;
      }

      NSMutableArray *bbox = [NSMutableArray arrayWithCapacity:4];
      for (NSValue *coords in box[@"bbox"]) {
        const CGPoint point = [coords CGPointValue];
        [bbox addObject:@{
          @"x" : @((point.x - left) * resizeRatio),
          @"y" : @((point.y - top) * resizeRatio)
        }];
      }

      NSDictionary *res = @{
        @"text" : decodedTexts[0],
        @"bbox" : bbox,
        @"score" : confidenceScore
      };
      [predictions addObject:res];
    }
  }

  return predictions;
}

@end
|
|
@@ -1,77 +0,0 @@
|
|
|
1
|
-
#import "Recognizer.h"
|
|
2
|
-
#import "../../utils/ImageProcessor.h"
|
|
3
|
-
#import "RecognizerUtils.h"
|
|
4
|
-
|
|
5
|
-
/*
|
|
6
|
-
The model used as the recognizer is based on the CRNN paper.
|
|
7
|
-
https://arxiv.org/pdf/1507.05717
|
|
8
|
-
*/
|
|
9
|
-
|
|
10
|
-
/// Text recognizer: feeds a grayscale crop to the model and reduces the output
/// to per-step best indices plus a confidence score.
@implementation Recognizer {
  cv::Size originalSize;
}

/// Returns cv::Size(second-to-last dim, last dim) of input tensor 0.
/// NOTE(review): cv::Size is (width, height), so `.width` here holds the
/// second-to-last dimension — confirm callers expect this order.
- (cv::Size)getModelImageSize {
  NSArray *shape = [module getInputShape:@0];
  const int lastDim = [shape.lastObject intValue];
  const int secondToLastDim = [shape[shape.count - 2] intValue];
  return cv::Size(secondToLastDim, lastDim);
}

/// Returns cv::Size(second-to-last dim, last dim) of output tensor 0.
/// -postprocess: reads `.height` of this value, i.e. the last dimension.
- (cv::Size)getModelOutputSize {
  NSArray *shape = [module getOutputShape:@0];
  const int lastDim = [shape.lastObject intValue];
  const int secondToLastDim = [shape[shape.count - 2] intValue];
  return cv::Size(secondToLastDim, lastDim);
}

/// Converts the grayscale image to the model's input representation.
- (NSArray *)preprocess:(cv::Mat &)input {
  return [ImageProcessor matToNSArrayGray:input];
}

/// Reduces the first output tensor to @[ best indices, confidence score ].
- (NSArray *)postprocess:(NSArray *)output {
  const int rowLength = [self getModelOutputSize].height;
  NSInteger total = [output.firstObject count];
  // Round up so a trailing partial row still gets a (zero-padded) row.
  NSInteger rowCount = (total + rowLength - 1) / rowLength;
  cv::Mat scores = cv::Mat::zeros(rowCount, rowLength, CV_32F);

  // Lay the flat output out row-major, `rowLength` values per row.
  NSInteger index = 0;
  for (NSNumber *value in output.firstObject) {
    scores.at<float>(index / rowLength, index % rowLength) = [value floatValue];
    ++index;
  }

  cv::Mat probabilities = [RecognizerUtils softmax:scores];
  NSMutableArray *rowSums =
      [RecognizerUtils sumProbabilityRows:probabilities
                        modelOutputHeight:rowLength];
  probabilities = [RecognizerUtils divideMatrix:probabilities byVector:rowSums];

  NSArray *bestValuesAndIndices =
      [RecognizerUtils findMaxValuesAndIndices:probabilities];
  NSArray *bestIndices = bestValuesAndIndices[1];
  const CGFloat confidenceScore =
      [RecognizerUtils computeConfidenceScore:bestValuesAndIndices[0]
                                 indicesArray:bestIndices];

  return @[ bestIndices, @(confidenceScore) ];
}

/// Full pipeline: preprocess -> forward -> postprocess.
- (NSArray *)runModel:(cv::Mat &)input {
  NSArray *tensor = [self preprocess:input];
  NSArray *rawOutput = [self forward:@[ tensor ]];
  return [self postprocess:rawOutput];
}

@end
|
|
@@ -1,10 +0,0 @@
|
|
|
1
|
-
#import "BaseModel.h"
|
|
2
|
-
#import "opencv2/opencv.hpp"
|
|
3
|
-
|
|
4
|
-
/// Detector variant built on BaseModel.
/// NOTE(review): the implementation is not visible here; the parameter
/// semantics below are inferred from the selector names only — confirm.
@interface VerticalDetector : BaseModel

/// Creates a detector configured with the `detectSingleCharacters` flag.
- (instancetype)initWithDetectSingleCharacters:(BOOL)detectSingleCharacters;

/// Spatial size of the image the model takes as input.
- (cv::Size)getModelImageSize;

/// Runs the detector on `input`.
- (NSArray *)runModel:(cv::Mat &)input;

@end
|