react-native-executorch 0.4.9 → 0.5.0-nightly-6f4dd53-20251211
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +77 -71
- package/android/CMakeLists.txt +29 -0
- package/android/build.gradle +76 -13
- package/android/libs/classes.jar +0 -0
- package/android/src/main/cpp/CMakeLists.txt +109 -0
- package/android/src/main/cpp/ETInstallerModule.cpp +76 -0
- package/android/src/main/cpp/ETInstallerModule.h +43 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/ETInstaller.kt +66 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/RnExecutorchPackage.kt +6 -124
- package/common/ada/ada.cpp +17406 -0
- package/common/ada/ada.h +10274 -0
- package/common/pfft/pfft.c +2205 -0
- package/common/pfft/pfft.h +185 -0
- package/common/rnexecutorch/Log.h +489 -0
- package/common/rnexecutorch/RnExecutorchInstaller.cpp +113 -0
- package/common/rnexecutorch/RnExecutorchInstaller.h +87 -0
- package/common/rnexecutorch/TokenizerModule.cpp +52 -0
- package/common/rnexecutorch/TokenizerModule.h +29 -0
- package/common/rnexecutorch/data_processing/FFT.cpp +21 -0
- package/common/rnexecutorch/data_processing/FFT.h +23 -0
- package/common/rnexecutorch/data_processing/FileUtils.h +30 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.cpp +240 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.h +55 -0
- package/common/rnexecutorch/data_processing/Numerical.cpp +111 -0
- package/common/rnexecutorch/data_processing/Numerical.h +77 -0
- package/common/rnexecutorch/data_processing/base64.cpp +110 -0
- package/common/rnexecutorch/data_processing/base64.h +46 -0
- package/common/rnexecutorch/data_processing/dsp.cpp +19 -0
- package/common/rnexecutorch/data_processing/dsp.h +12 -0
- package/common/rnexecutorch/data_processing/gzip.cpp +47 -0
- package/common/rnexecutorch/data_processing/gzip.h +7 -0
- package/common/rnexecutorch/host_objects/JSTensorViewIn.h +12 -0
- package/common/rnexecutorch/host_objects/JSTensorViewOut.h +22 -0
- package/common/rnexecutorch/host_objects/JsiConversions.h +418 -0
- package/common/rnexecutorch/host_objects/ModelHostObject.h +313 -0
- package/common/rnexecutorch/jsi/JsiHostObject.cpp +108 -0
- package/common/rnexecutorch/jsi/JsiHostObject.h +87 -0
- package/common/rnexecutorch/jsi/OwningArrayBuffer.h +57 -0
- package/common/rnexecutorch/jsi/Promise.cpp +20 -0
- package/common/rnexecutorch/jsi/Promise.h +69 -0
- package/common/rnexecutorch/jsi/RuntimeAwareCache.h +58 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.cpp +53 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.h +35 -0
- package/common/rnexecutorch/metaprogramming/ConstructorHelpers.h +133 -0
- package/common/rnexecutorch/metaprogramming/FunctionHelpers.h +50 -0
- package/common/rnexecutorch/metaprogramming/TypeConcepts.h +37 -0
- package/common/rnexecutorch/models/BaseModel.cpp +183 -0
- package/common/rnexecutorch/models/BaseModel.h +61 -0
- package/common/rnexecutorch/models/classification/Classification.cpp +72 -0
- package/common/rnexecutorch/models/classification/Classification.h +31 -0
- package/{ios/RnExecutorch/models/classification/Constants.mm → common/rnexecutorch/models/classification/Constants.h} +7 -2
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.cpp +19 -0
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.h +17 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.cpp +45 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.h +28 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.cpp +60 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.h +31 -0
- package/{ios/RnExecutorch/models/image_segmentation/Constants.mm → common/rnexecutorch/models/image_segmentation/Constants.h} +7 -2
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.cpp +168 -0
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.h +50 -0
- package/common/rnexecutorch/models/llm/LLM.cpp +98 -0
- package/common/rnexecutorch/models/llm/LLM.h +38 -0
- package/{ios/RnExecutorch/utils/Constants.mm → common/rnexecutorch/models/object_detection/Constants.h} +9 -2
- package/common/rnexecutorch/models/object_detection/ObjectDetection.cpp +82 -0
- package/common/rnexecutorch/models/object_detection/ObjectDetection.h +37 -0
- package/common/rnexecutorch/models/object_detection/Types.h +13 -0
- package/{ios/RnExecutorch/utils/ObjectDetectionUtils.mm → common/rnexecutorch/models/object_detection/Utils.cpp} +17 -35
- package/common/rnexecutorch/models/object_detection/Utils.h +11 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.cpp +88 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.h +29 -0
- package/common/rnexecutorch/models/ocr/Constants.h +41 -0
- package/common/rnexecutorch/models/ocr/Detector.cpp +100 -0
- package/common/rnexecutorch/models/ocr/Detector.h +30 -0
- package/common/rnexecutorch/models/ocr/OCR.cpp +53 -0
- package/common/rnexecutorch/models/ocr/OCR.h +44 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.cpp +108 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.h +42 -0
- package/common/rnexecutorch/models/ocr/Recognizer.cpp +80 -0
- package/common/rnexecutorch/models/ocr/Recognizer.h +36 -0
- package/common/rnexecutorch/models/ocr/Types.h +35 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.cpp +710 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.h +81 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.cpp +159 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.h +72 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.cpp +204 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.h +71 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +125 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +57 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.cpp +303 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.h +61 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.cpp +82 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.h +25 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.cpp +99 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.h +33 -0
- package/common/rnexecutorch/models/speech_to_text/types/DecodingOptions.h +15 -0
- package/common/rnexecutorch/models/speech_to_text/types/GenerationResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/ProcessResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/Segment.h +14 -0
- package/common/rnexecutorch/models/speech_to_text/types/Word.h +13 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.cpp +55 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.h +35 -0
- package/common/rnexecutorch/models/text_to_image/Constants.h +9 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.cpp +32 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.h +24 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.cpp +44 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.h +32 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.cpp +152 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.h +41 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.cpp +141 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.h +64 -0
- package/common/rnexecutorch/models/text_to_image/UNet.cpp +38 -0
- package/common/rnexecutorch/models/text_to_image/UNet.h +28 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.cpp +93 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.h +49 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.cpp +180 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.h +85 -0
- package/common/rnexecutorch/models/voice_activity_detection/Constants.h +27 -0
- package/common/rnexecutorch/models/voice_activity_detection/Types.h +12 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.cpp +15 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.h +13 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.cpp +160 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.h +36 -0
- package/common/rnexecutorch/tests/CMakeLists.txt +30 -0
- package/common/rnexecutorch/tests/LogTest.cpp +530 -0
- package/common/rnexecutorch/tests/NumericalTest.cpp +110 -0
- package/common/rnexecutorch/tests/README.md +37 -0
- package/common/rnexecutorch/threads/GlobalThreadPool.h +84 -0
- package/common/rnexecutorch/threads/HighPerformanceThreadPool.h +364 -0
- package/common/rnexecutorch/threads/utils/ThreadUtils.h +29 -0
- package/common/runner/arange_util.cpp +44 -0
- package/common/runner/arange_util.h +37 -0
- package/common/runner/constants.h +28 -0
- package/common/runner/io_manager.h +240 -0
- package/common/runner/irunner.h +119 -0
- package/common/runner/kernel_includes.h +23 -0
- package/common/runner/runner.cpp +369 -0
- package/common/runner/runner.h +85 -0
- package/common/runner/sampler.cpp +201 -0
- package/common/runner/sampler.h +67 -0
- package/common/runner/stats.h +161 -0
- package/common/runner/text_decoder_runner.cpp +79 -0
- package/common/runner/text_decoder_runner.h +126 -0
- package/common/runner/text_prefiller.cpp +125 -0
- package/common/runner/text_prefiller.h +85 -0
- package/common/runner/text_token_generator.h +205 -0
- package/common/runner/util.h +153 -0
- package/ios/RnExecutorch/ETInstaller.h +8 -0
- package/ios/RnExecutorch/ETInstaller.mm +56 -0
- package/ios/RnExecutorch.xcodeproj/project.pbxproj +73 -23
- package/lib/module/Error.js +3 -0
- package/lib/module/Error.js.map +1 -1
- package/lib/module/common/Logger.js +23 -0
- package/lib/module/common/Logger.js.map +1 -0
- package/lib/module/constants/directories.js +1 -1
- package/lib/module/constants/directories.js.map +1 -1
- package/lib/module/constants/llmDefaults.js +8 -0
- package/lib/module/constants/llmDefaults.js.map +1 -1
- package/lib/module/constants/modelUrls.js +356 -84
- package/lib/module/constants/modelUrls.js.map +1 -1
- package/lib/module/constants/ocr/models.js +181 -286
- package/lib/module/constants/ocr/models.js.map +1 -1
- package/lib/module/constants/ocr/symbols.js +66 -65
- package/lib/module/constants/ocr/symbols.js.map +1 -1
- package/lib/module/controllers/LLMController.js +54 -24
- package/lib/module/controllers/LLMController.js.map +1 -1
- package/lib/module/controllers/OCRController.js +17 -10
- package/lib/module/controllers/OCRController.js.map +1 -1
- package/lib/module/controllers/VerticalOCRController.js +17 -10
- package/lib/module/controllers/VerticalOCRController.js.map +1 -1
- package/lib/module/hooks/computer_vision/useClassification.js +4 -4
- package/lib/module/hooks/computer_vision/useClassification.js.map +1 -1
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js +13 -0
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js.map +1 -0
- package/lib/module/hooks/computer_vision/useImageSegmentation.js +2 -2
- package/lib/module/hooks/computer_vision/useImageSegmentation.js.map +1 -1
- package/lib/module/hooks/computer_vision/useOCR.js +16 -17
- package/lib/module/hooks/computer_vision/useOCR.js.map +1 -1
- package/lib/module/hooks/computer_vision/useObjectDetection.js +3 -3
- package/lib/module/hooks/computer_vision/useObjectDetection.js.map +1 -1
- package/lib/module/hooks/computer_vision/useStyleTransfer.js +3 -3
- package/lib/module/hooks/computer_vision/useStyleTransfer.js.map +1 -1
- package/lib/module/hooks/computer_vision/useTextToImage.js +57 -0
- package/lib/module/hooks/computer_vision/useTextToImage.js.map +1 -0
- package/lib/module/hooks/computer_vision/useVerticalOCR.js +18 -19
- package/lib/module/hooks/computer_vision/useVerticalOCR.js.map +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useLLM.js +30 -29
- package/lib/module/hooks/natural_language_processing/useLLM.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js +72 -33
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js +2 -3
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTokenizer.js +19 -18
- package/lib/module/hooks/natural_language_processing/useTokenizer.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useVAD.js +13 -0
- package/lib/module/hooks/natural_language_processing/useVAD.js.map +1 -0
- package/lib/module/hooks/useModule.js +13 -9
- package/lib/module/hooks/useModule.js.map +1 -1
- package/lib/module/index.js +21 -3
- package/lib/module/index.js.map +1 -1
- package/lib/module/modules/BaseModule.js +9 -14
- package/lib/module/modules/BaseModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ClassificationModule.js +11 -6
- package/lib/module/modules/computer_vision/ClassificationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js +19 -0
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js.map +1 -0
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js +20 -18
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/OCRModule.js +13 -10
- package/lib/module/modules/computer_vision/OCRModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js +11 -6
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js.map +1 -1
- package/lib/module/modules/computer_vision/StyleTransferModule.js +11 -6
- package/lib/module/modules/computer_vision/StyleTransferModule.js.map +1 -1
- package/lib/module/modules/computer_vision/TextToImageModule.js +48 -0
- package/lib/module/modules/computer_vision/TextToImageModule.js.map +1 -0
- package/lib/module/modules/computer_vision/VerticalOCRModule.js +15 -10
- package/lib/module/modules/computer_vision/VerticalOCRModule.js.map +1 -1
- package/lib/module/modules/general/ExecutorchModule.js +8 -34
- package/lib/module/modules/general/ExecutorchModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/LLMModule.js +25 -24
- package/lib/module/modules/natural_language_processing/LLMModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +109 -27
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js +13 -6
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TokenizerModule.js +20 -14
- package/lib/module/modules/natural_language_processing/TokenizerModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/VADModule.js +19 -0
- package/lib/module/modules/natural_language_processing/VADModule.js.map +1 -0
- package/lib/module/native/NativeETInstaller.js +5 -0
- package/lib/module/native/NativeETInstaller.js.map +1 -0
- package/lib/module/native/RnExecutorchModules.js +2 -12
- package/lib/module/native/RnExecutorchModules.js.map +1 -1
- package/lib/module/types/common.js +25 -8
- package/lib/module/types/common.js.map +1 -1
- package/lib/module/types/llm.js.map +1 -1
- package/lib/module/types/stt.js +1 -79
- package/lib/module/types/stt.js.map +1 -1
- package/lib/module/types/vad.js +2 -0
- package/lib/module/types/vad.js.map +1 -0
- package/lib/module/utils/ResourceFetcher.js +275 -114
- package/lib/module/utils/ResourceFetcher.js.map +1 -1
- package/lib/module/utils/ResourceFetcherUtils.js +155 -0
- package/lib/module/utils/ResourceFetcherUtils.js.map +1 -0
- package/lib/module/utils/llm.js +41 -1
- package/lib/module/utils/llm.js.map +1 -1
- package/lib/typescript/Error.d.ts +3 -0
- package/lib/typescript/Error.d.ts.map +1 -1
- package/lib/typescript/common/Logger.d.ts +9 -0
- package/lib/typescript/common/Logger.d.ts.map +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts.map +1 -1
- package/lib/typescript/constants/modelUrls.d.ts +263 -79
- package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/models.d.ts +882 -284
- package/lib/typescript/constants/ocr/models.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts.map +1 -1
- package/lib/typescript/controllers/LLMController.d.ts +8 -7
- package/lib/typescript/controllers/LLMController.d.ts.map +1 -1
- package/lib/typescript/controllers/OCRController.d.ts +5 -6
- package/lib/typescript/controllers/OCRController.d.ts.map +1 -1
- package/lib/typescript/controllers/VerticalOCRController.d.ts +5 -6
- package/lib/typescript/controllers/VerticalOCRController.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts +8 -6
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts +16 -0
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts +5 -5
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts +22 -0
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts +4 -6
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/general/useExecutorchModule.d.ts +1 -1
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -22
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts +9 -5
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts +16 -0
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts.map +1 -0
- package/lib/typescript/hooks/useModule.d.ts +8 -5
- package/lib/typescript/hooks/useModule.d.ts.map +1 -1
- package/lib/typescript/index.d.ts +26 -3
- package/lib/typescript/index.d.ts.map +1 -1
- package/lib/typescript/modules/BaseModule.d.ts +7 -6
- package/lib/typescript/modules/BaseModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts +4 -4
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts +9 -0
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts +7 -27
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts +8 -7
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts +5 -3
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts +4 -3
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts +16 -0
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts +7 -8
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/general/ExecutorchModule.d.ts +4 -7
- package/lib/typescript/modules/general/ExecutorchModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts +19 -17
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +17 -13
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts +5 -3
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts +10 -9
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts +10 -0
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts.map +1 -0
- package/lib/typescript/native/{NativeStyleTransfer.d.ts → NativeETInstaller.d.ts} +2 -3
- package/lib/typescript/native/NativeETInstaller.d.ts.map +1 -0
- package/lib/typescript/native/RnExecutorchModules.d.ts +3 -23
- package/lib/typescript/native/RnExecutorchModules.d.ts.map +1 -1
- package/lib/typescript/types/common.d.ts +30 -2
- package/lib/typescript/types/common.d.ts.map +1 -1
- package/lib/typescript/types/llm.d.ts +9 -1
- package/lib/typescript/types/llm.d.ts.map +1 -1
- package/lib/typescript/types/stt.d.ts +9 -88
- package/lib/typescript/types/stt.d.ts.map +1 -1
- package/lib/typescript/types/vad.d.ts +5 -0
- package/lib/typescript/types/vad.d.ts.map +1 -0
- package/lib/typescript/utils/ResourceFetcher.d.ts +47 -10
- package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts +55 -0
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -0
- package/lib/typescript/utils/llm.d.ts +4 -0
- package/lib/typescript/utils/llm.d.ts.map +1 -1
- package/package.json +32 -68
- package/react-native-executorch.podspec +62 -4
- package/src/Error.ts +3 -0
- package/src/common/Logger.ts +25 -0
- package/src/constants/directories.ts +1 -1
- package/src/constants/llmDefaults.ts +11 -0
- package/src/constants/modelUrls.ts +433 -168
- package/src/constants/ocr/models.ts +826 -395
- package/src/constants/ocr/symbols.ts +66 -65
- package/src/controllers/LLMController.ts +77 -37
- package/src/controllers/OCRController.ts +25 -16
- package/src/controllers/VerticalOCRController.ts +25 -15
- package/src/hooks/computer_vision/useClassification.ts +8 -9
- package/src/hooks/computer_vision/useImageEmbeddings.ts +15 -0
- package/src/hooks/computer_vision/useImageSegmentation.ts +3 -6
- package/src/hooks/computer_vision/useOCR.ts +32 -25
- package/src/hooks/computer_vision/useObjectDetection.ts +4 -7
- package/src/hooks/computer_vision/useStyleTransfer.ts +4 -4
- package/src/hooks/computer_vision/useTextToImage.ts +92 -0
- package/src/hooks/computer_vision/useVerticalOCR.ts +33 -31
- package/src/hooks/general/useExecutorchModule.ts +1 -1
- package/src/hooks/natural_language_processing/useLLM.ts +54 -31
- package/src/hooks/natural_language_processing/useSpeechToText.ts +96 -88
- package/src/hooks/natural_language_processing/useTextEmbeddings.ts +9 -9
- package/src/hooks/natural_language_processing/useTokenizer.ts +21 -21
- package/src/hooks/natural_language_processing/useVAD.ts +15 -0
- package/src/hooks/useModule.ts +23 -13
- package/src/index.ts +126 -0
- package/src/modules/BaseModule.ts +17 -22
- package/src/modules/computer_vision/ClassificationModule.ts +18 -9
- package/src/modules/computer_vision/ImageEmbeddingsModule.ts +26 -0
- package/src/modules/computer_vision/ImageSegmentationModule.ts +34 -26
- package/src/modules/computer_vision/OCRModule.ts +23 -15
- package/src/modules/computer_vision/ObjectDetectionModule.ts +22 -9
- package/src/modules/computer_vision/StyleTransferModule.ts +18 -9
- package/src/modules/computer_vision/TextToImageModule.ts +93 -0
- package/src/modules/computer_vision/VerticalOCRModule.ts +25 -21
- package/src/modules/general/ExecutorchModule.ts +16 -46
- package/src/modules/natural_language_processing/LLMModule.ts +41 -32
- package/src/modules/natural_language_processing/SpeechToTextModule.ts +164 -66
- package/src/modules/natural_language_processing/TextEmbeddingsModule.ts +25 -10
- package/src/modules/natural_language_processing/TokenizerModule.ts +27 -17
- package/src/modules/natural_language_processing/VADModule.ts +27 -0
- package/src/native/NativeETInstaller.ts +8 -0
- package/src/native/RnExecutorchModules.ts +4 -50
- package/src/types/common.ts +40 -12
- package/src/types/llm.ts +10 -0
- package/src/types/stt.ts +87 -90
- package/src/types/vad.ts +4 -0
- package/src/utils/ResourceFetcher.ts +342 -120
- package/src/utils/ResourceFetcherUtils.ts +184 -0
- package/src/utils/llm.ts +65 -1
- package/third-party/android/libs/cpuinfo/arm64-v8a/libcpuinfo.so +0 -0
- package/third-party/android/libs/executorch/arm64-v8a/libexecutorch.so +0 -0
- package/third-party/android/libs/executorch/x86_64/libexecutorch.so +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_hal.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_thread.a +0 -0
- package/third-party/android/libs/pthreadpool/arm64-v8a/libpthreadpool.so +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libsentencepiece.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_cpp.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib → third-party/android/libs/tokenizers-cpp/x86_64/libsentencepiece.a} +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_cpp.a +0 -0
- package/third-party/include/c10/macros/Export.h +1 -0
- package/third-party/include/c10/macros/Macros.h +1 -0
- package/third-party/include/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/c10/util/BFloat16.h +1 -0
- package/third-party/include/c10/util/Half-inl.h +1 -0
- package/third-party/include/c10/util/Half.h +8 -0
- package/third-party/include/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/c10/util/bit_cast.h +1 -0
- package/third-party/include/c10/util/complex.h +72 -0
- package/third-party/include/c10/util/complex_math.h +399 -0
- package/third-party/include/c10/util/complex_utils.h +41 -0
- package/third-party/include/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/c10/util/irange.h +107 -0
- package/third-party/include/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/c10/util/overflows.h +95 -0
- package/third-party/include/c10/util/safe_numerics.h +97 -0
- package/third-party/include/cpuinfo/cpuinfo.h +2305 -0
- package/third-party/include/executorch/ExecuTorch.h +13 -0
- package/third-party/include/executorch/ExecuTorchError.h +90 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLM.h +12 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMConfig.h +56 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMError.h +16 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMMultimodalRunner.h +227 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMTextRunner.h +97 -0
- package/third-party/include/executorch/ExecuTorchLLM/module.modulemap +4 -0
- package/third-party/include/executorch/ExecuTorchLog.h +77 -0
- package/third-party/include/executorch/ExecuTorchModule.h +563 -0
- package/third-party/include/executorch/ExecuTorchTensor.h +1421 -0
- package/third-party/include/executorch/ExecuTorchValue.h +265 -0
- package/third-party/include/executorch/extension/module/bundled_module.h +131 -0
- package/third-party/include/executorch/extension/module/module.h +649 -0
- package/third-party/include/executorch/extension/tensor/tensor.h +14 -0
- package/third-party/include/executorch/extension/tensor/tensor_accessor.h +190 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr.h +409 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr_maker.h +653 -0
- package/third-party/include/executorch/extension/threadpool/cpuinfo_utils.h +24 -0
- package/third-party/include/executorch/extension/threadpool/threadpool.h +95 -0
- package/third-party/include/executorch/runtime/backend/backend_execution_context.h +71 -0
- package/third-party/include/executorch/runtime/backend/backend_init_context.h +84 -0
- package/third-party/include/executorch/runtime/backend/backend_option_context.h +34 -0
- package/third-party/include/executorch/runtime/backend/interface.h +227 -0
- package/third-party/include/executorch/runtime/backend/options.h +206 -0
- package/third-party/include/executorch/runtime/core/array_ref.h +235 -0
- package/third-party/include/executorch/runtime/core/data_loader.h +136 -0
- package/third-party/include/executorch/runtime/core/defines.h +20 -0
- package/third-party/include/executorch/runtime/core/error.h +256 -0
- package/third-party/include/executorch/runtime/core/evalue.h +515 -0
- package/third-party/include/executorch/runtime/core/event_tracer.h +580 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks.h +332 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks_delegate.h +197 -0
- package/third-party/include/executorch/runtime/core/exec_aten/exec_aten.h +170 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/dim_order_util.h +264 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/scalar_type_util.h +1313 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_dimension_limit.h +21 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_shape_to_c_string.h +69 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_util.h +1251 -0
- package/third-party/include/executorch/runtime/core/freeable_buffer.h +107 -0
- package/third-party/include/executorch/runtime/core/function_ref.h +100 -0
- package/third-party/include/executorch/runtime/core/hierarchical_allocator.h +107 -0
- package/third-party/include/executorch/runtime/core/memory_allocator.h +208 -0
- package/third-party/include/executorch/runtime/core/named_data_map.h +76 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16_math.h +14 -0
- package/third-party/include/executorch/runtime/core/portable_type/bits_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Export.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Macros.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half.h +8 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/bit_cast.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex.h +72 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_math.h +399 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_utils.h +41 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/irange.h +107 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/overflows.h +95 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/safe_numerics.h +97 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/include/executorch/runtime/core/portable_type/complex.h +21 -0
- package/third-party/include/executorch/runtime/core/portable_type/device.h +70 -0
- package/third-party/include/executorch/runtime/core/portable_type/half.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/optional.h +36 -0
- package/third-party/include/executorch/runtime/core/portable_type/qint_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar.h +110 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar_type.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/string_view.h +29 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor.h +142 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_impl.h +281 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_options.h +60 -0
- package/third-party/include/executorch/runtime/core/result.h +258 -0
- package/third-party/include/executorch/runtime/core/span.h +97 -0
- package/third-party/include/executorch/runtime/core/tag.h +90 -0
- package/third-party/include/executorch/runtime/core/tensor_layout.h +79 -0
- package/third-party/include/executorch/runtime/core/tensor_shape_dynamism.h +39 -0
- package/third-party/include/executorch/runtime/executor/memory_manager.h +113 -0
- package/third-party/include/executorch/runtime/executor/merged_data_map.h +142 -0
- package/third-party/include/executorch/runtime/executor/method.h +412 -0
- package/third-party/include/executorch/runtime/executor/method_meta.h +298 -0
- package/third-party/include/executorch/runtime/executor/program.h +309 -0
- package/third-party/include/executorch/runtime/executor/pte_data_map.h +145 -0
- package/third-party/include/executorch/runtime/executor/tensor_parser.h +157 -0
- package/third-party/include/executorch/runtime/kernel/kernel_runtime_context.h +122 -0
- package/third-party/include/executorch/runtime/kernel/operator_registry.h +280 -0
- package/third-party/include/executorch/runtime/platform/abort.h +36 -0
- package/third-party/include/executorch/runtime/platform/assert.h +119 -0
- package/third-party/include/executorch/runtime/platform/clock.h +43 -0
- package/third-party/include/executorch/runtime/platform/compat_unistd.h +75 -0
- package/third-party/include/executorch/runtime/platform/compiler.h +201 -0
- package/third-party/include/executorch/runtime/platform/log.h +177 -0
- package/third-party/include/executorch/runtime/platform/platform.h +259 -0
- package/third-party/include/executorch/runtime/platform/profiler.h +292 -0
- package/third-party/include/executorch/runtime/platform/runtime.h +35 -0
- package/third-party/include/executorch/runtime/platform/system.h +49 -0
- package/third-party/include/executorch/runtime/platform/types.h +24 -0
- package/third-party/include/executorch/schema/extended_header.h +85 -0
- package/third-party/include/headeronly/macros/Export.h +88 -0
- package/third-party/include/opencv2/core/affine.hpp +676 -0
- package/third-party/include/opencv2/core/async.hpp +107 -0
- package/third-party/include/opencv2/core/base.hpp +735 -0
- package/third-party/include/opencv2/core/bindings_utils.hpp +279 -0
- package/third-party/include/opencv2/core/bufferpool.hpp +39 -0
- package/third-party/include/opencv2/core/check.hpp +231 -0
- package/third-party/include/opencv2/core/core.hpp +55 -0
- package/third-party/include/opencv2/core/core_c.h +3261 -0
- package/third-party/include/opencv2/core/cv_cpu_dispatch.h +404 -0
- package/third-party/include/opencv2/core/cv_cpu_helper.h +856 -0
- package/third-party/include/opencv2/core/cvdef.h +1003 -0
- package/third-party/include/opencv2/core/cvstd.hpp +196 -0
- package/third-party/include/opencv2/core/cvstd.inl.hpp +188 -0
- package/third-party/include/opencv2/core/cvstd_wrapper.hpp +187 -0
- package/third-party/include/opencv2/core/detail/async_promise.hpp +73 -0
- package/third-party/include/opencv2/core/detail/dispatch_helper.impl.hpp +48 -0
- package/third-party/include/opencv2/core/detail/exception_ptr.hpp +24 -0
- package/third-party/include/opencv2/core/dualquaternion.hpp +1054 -0
- package/third-party/include/opencv2/core/dualquaternion.inl.hpp +464 -0
- package/third-party/include/opencv2/core/eigen.hpp +405 -0
- package/third-party/include/opencv2/core/fast_math.hpp +433 -0
- package/third-party/include/opencv2/core/hal/hal.hpp +451 -0
- package/third-party/include/opencv2/core/hal/interface.h +191 -0
- package/third-party/include/opencv2/core/hal/intrin.hpp +1222 -0
- package/third-party/include/opencv2/core/hal/intrin_avx.hpp +3378 -0
- package/third-party/include/opencv2/core/hal/intrin_avx512.hpp +3688 -0
- package/third-party/include/opencv2/core/hal/intrin_cpp.hpp +3446 -0
- package/third-party/include/opencv2/core/hal/intrin_forward.hpp +195 -0
- package/third-party/include/opencv2/core/hal/intrin_lasx.hpp +3243 -0
- package/third-party/include/opencv2/core/hal/intrin_lsx.hpp +2671 -0
- package/third-party/include/opencv2/core/hal/intrin_math.hpp +772 -0
- package/third-party/include/opencv2/core/hal/intrin_msa.hpp +1973 -0
- package/third-party/include/opencv2/core/hal/intrin_neon.hpp +2710 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv071.hpp +3452 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv_scalable.hpp +2559 -0
- package/third-party/include/opencv2/core/hal/intrin_sse.hpp +3528 -0
- package/third-party/include/opencv2/core/hal/intrin_sse_em.hpp +175 -0
- package/third-party/include/opencv2/core/hal/intrin_vsx.hpp +1756 -0
- package/third-party/include/opencv2/core/hal/intrin_wasm.hpp +2911 -0
- package/third-party/include/opencv2/core/hal/msa_macros.h +2079 -0
- package/third-party/include/opencv2/core/hal/simd_utils.impl.hpp +313 -0
- package/third-party/include/opencv2/core/mat.hpp +3842 -0
- package/third-party/include/opencv2/core/mat.inl.hpp +2753 -0
- package/third-party/include/opencv2/core/matx.hpp +603 -0
- package/third-party/include/opencv2/core/matx.inl.hpp +1132 -0
- package/third-party/include/opencv2/core/neon_utils.hpp +127 -0
- package/third-party/include/opencv2/core/operations.hpp +610 -0
- package/third-party/include/opencv2/core/optim.hpp +362 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.openmp.hpp +66 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.tbb.hpp +148 -0
- package/third-party/include/opencv2/core/parallel/parallel_backend.hpp +108 -0
- package/third-party/include/opencv2/core/persistence.hpp +1321 -0
- package/third-party/include/opencv2/core/quaternion.hpp +1889 -0
- package/third-party/include/opencv2/core/quaternion.inl.hpp +907 -0
- package/third-party/include/opencv2/core/saturate.hpp +347 -0
- package/third-party/include/opencv2/core/simd_intrinsics.hpp +90 -0
- package/third-party/include/opencv2/core/softfloat.hpp +657 -0
- package/third-party/include/opencv2/core/sse_utils.hpp +861 -0
- package/third-party/include/opencv2/core/traits.hpp +417 -0
- package/third-party/include/opencv2/core/types.hpp +2368 -0
- package/third-party/include/opencv2/core/types_c.h +2064 -0
- package/third-party/include/opencv2/core/utility.hpp +1296 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.hpp +31 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.impl.hpp +111 -0
- package/third-party/include/opencv2/core/utils/filesystem.hpp +91 -0
- package/third-party/include/opencv2/core/utils/fp_control_utils.hpp +70 -0
- package/third-party/include/opencv2/core/utils/instrumentation.hpp +127 -0
- package/third-party/include/opencv2/core/utils/logger.defines.hpp +50 -0
- package/third-party/include/opencv2/core/utils/logger.hpp +258 -0
- package/third-party/include/opencv2/core/utils/logtag.hpp +27 -0
- package/third-party/include/opencv2/core/utils/tls.hpp +230 -0
- package/third-party/include/opencv2/core/utils/trace.hpp +281 -0
- package/third-party/include/opencv2/core/version.hpp +29 -0
- package/third-party/include/opencv2/core/vsx_utils.hpp +1115 -0
- package/third-party/include/opencv2/core.hpp +3699 -0
- package/third-party/include/opencv2/cvconfig.h +155 -0
- package/third-party/include/opencv2/dnn/dnn.hpp +51 -0
- package/third-party/include/opencv2/dnn.hpp +17 -0
- package/third-party/include/opencv2/features2d/features2d.hpp +55 -0
- package/third-party/include/opencv2/features2d/hal/interface.h +32 -0
- package/third-party/include/opencv2/features2d.hpp +1756 -0
- package/third-party/include/opencv2/highgui/highgui.hpp +113 -0
- package/third-party/include/opencv2/highgui.hpp +17 -0
- package/third-party/include/opencv2/imgproc/bindings.hpp +34 -0
- package/third-party/include/opencv2/imgproc/detail/gcgraph.hpp +355 -0
- package/third-party/include/opencv2/imgproc/detail/legacy.hpp +35 -0
- package/third-party/include/opencv2/imgproc/hal/hal.hpp +246 -0
- package/third-party/include/opencv2/imgproc/hal/interface.h +52 -0
- package/third-party/include/opencv2/imgproc/imgproc.hpp +55 -0
- package/third-party/include/opencv2/imgproc/imgproc_c.h +1261 -0
- package/third-party/include/opencv2/imgproc/segmentation.hpp +168 -0
- package/third-party/include/opencv2/imgproc/types_c.h +632 -0
- package/third-party/include/opencv2/imgproc.hpp +5956 -0
- package/third-party/include/opencv2/opencv.hpp +102 -0
- package/third-party/include/opencv2/opencv_modules.hpp +19 -0
- package/third-party/include/opencv2/photo/legacy/constants_c.h +10 -0
- package/third-party/include/opencv2/photo/photo.hpp +55 -0
- package/third-party/include/opencv2/photo.hpp +975 -0
- package/third-party/include/opencv2/video/background_segm.hpp +341 -0
- package/third-party/include/opencv2/video/detail/tracking.detail.hpp +435 -0
- package/third-party/include/opencv2/video/legacy/constants_c.h +15 -0
- package/third-party/include/opencv2/video/tracking.hpp +1014 -0
- package/third-party/include/opencv2/video/video.hpp +55 -0
- package/third-party/include/opencv2/video.hpp +65 -0
- package/third-party/include/pthreadpool/pthreadpool.h +2236 -0
- package/third-party/include/tokenizers-cpp/tokenizers_c.h +61 -0
- package/third-party/include/tokenizers-cpp/tokenizers_cpp.h +118 -0
- package/third-party/include/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/libs/cpuinfo/libcpuinfo.a +0 -0
- package/third-party/ios/libs/pthreadpool/physical-arm64-release/libpthreadpool.a +0 -0
- package/third-party/ios/libs/pthreadpool/simulator-arm64-debug/libpthreadpool.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libsentencepiece.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib → third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_c.a} +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_cpp.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libsentencepiece.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_c.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_cpp.a +0 -0
- package/LICENSE +0 -79
- package/android/src/main/java/com/swmansion/rnexecutorch/Classification.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/ETModule.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ImageSegmentation.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/LLM.kt +0 -63
- package/android/src/main/java/com/swmansion/rnexecutorch/OCR.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ObjectDetection.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/SpeechToText.kt +0 -91
- package/android/src/main/java/com/swmansion/rnexecutorch/StyleTransfer.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/TextEmbeddings.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/Tokenizer.kt +0 -86
- package/android/src/main/java/com/swmansion/rnexecutorch/VerticalOCR.kt +0 -179
- package/android/src/main/java/com/swmansion/rnexecutorch/models/BaseModel.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsModel.kt +0 -48
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsUtils.kt +0 -37
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/ClassificationModel.kt +0 -46
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/Constants.kt +0 -1005
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/Constants.kt +0 -26
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/ImageSegmentationModel.kt +0 -142
- package/android/src/main/java/com/swmansion/rnexecutorch/models/objectDetection/SSDLiteLargeModel.kt +0 -74
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Detector.kt +0 -82
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/RecognitionHandler.kt +0 -117
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Recognizer.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/VerticalDetector.kt +0 -89
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/CTCLabelConverter.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/Constants.kt +0 -31
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/DetectorUtils.kt +0 -608
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/RecognizerUtils.kt +0 -430
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TDecoder.kt +0 -39
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TModule.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Moonshine.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineDecoder.kt +0 -23
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineEncoder.kt +0 -20
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Whisper.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperDecoder.kt +0 -22
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperEncoder.kt +0 -29
- package/android/src/main/java/com/swmansion/rnexecutorch/models/styleTransfer/StyleTransferModel.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ArrayUtils.kt +0 -87
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ETError.kt +0 -34
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ImageProcessor.kt +0 -237
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/Numerical.kt +0 -8
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ObjectDetectionUtils.kt +0 -201
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/STFT.kt +0 -50
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/TensorUtils.kt +0 -103
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/RnExecutorch/Classification.h +0 -5
- package/ios/RnExecutorch/Classification.mm +0 -54
- package/ios/RnExecutorch/ETModule.h +0 -5
- package/ios/RnExecutorch/ETModule.mm +0 -75
- package/ios/RnExecutorch/ImageSegmentation.h +0 -5
- package/ios/RnExecutorch/ImageSegmentation.mm +0 -60
- package/ios/RnExecutorch/LLM.h +0 -5
- package/ios/RnExecutorch/LLM.mm +0 -78
- package/ios/RnExecutorch/OCR.h +0 -5
- package/ios/RnExecutorch/OCR.mm +0 -96
- package/ios/RnExecutorch/ObjectDetection.h +0 -5
- package/ios/RnExecutorch/ObjectDetection.mm +0 -56
- package/ios/RnExecutorch/SpeechToText.h +0 -5
- package/ios/RnExecutorch/SpeechToText.mm +0 -125
- package/ios/RnExecutorch/StyleTransfer.h +0 -5
- package/ios/RnExecutorch/StyleTransfer.mm +0 -55
- package/ios/RnExecutorch/TextEmbeddings.h +0 -5
- package/ios/RnExecutorch/TextEmbeddings.mm +0 -62
- package/ios/RnExecutorch/Tokenizer.h +0 -5
- package/ios/RnExecutorch/Tokenizer.mm +0 -83
- package/ios/RnExecutorch/VerticalOCR.h +0 -5
- package/ios/RnExecutorch/VerticalOCR.mm +0 -183
- package/ios/RnExecutorch/models/BaseModel.h +0 -21
- package/ios/RnExecutorch/models/BaseModel.mm +0 -43
- package/ios/RnExecutorch/models/classification/ClassificationModel.h +0 -10
- package/ios/RnExecutorch/models/classification/ClassificationModel.mm +0 -53
- package/ios/RnExecutorch/models/classification/Constants.h +0 -3
- package/ios/RnExecutorch/models/image_segmentation/Constants.h +0 -4
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.h +0 -10
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.mm +0 -146
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.hpp +0 -11
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.mm +0 -64
- package/ios/RnExecutorch/models/ocr/Detector.h +0 -9
- package/ios/RnExecutorch/models/ocr/Detector.mm +0 -101
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.h +0 -16
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.mm +0 -135
- package/ios/RnExecutorch/models/ocr/Recognizer.h +0 -8
- package/ios/RnExecutorch/models/ocr/Recognizer.mm +0 -77
- package/ios/RnExecutorch/models/ocr/VerticalDetector.h +0 -10
- package/ios/RnExecutorch/models/ocr/VerticalDetector.mm +0 -118
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.h +0 -16
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.mm +0 -80
- package/ios/RnExecutorch/models/ocr/utils/Constants.h +0 -26
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.h +0 -31
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.mm +0 -754
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.h +0 -10
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.mm +0 -67
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.h +0 -35
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.mm +0 -331
- package/ios/RnExecutorch/models/stt/Moonshine.hpp +0 -13
- package/ios/RnExecutorch/models/stt/Moonshine.mm +0 -64
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.mm +0 -24
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.mm +0 -18
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.hpp +0 -26
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.mm +0 -19
- package/ios/RnExecutorch/models/stt/Whisper.hpp +0 -12
- package/ios/RnExecutorch/models/stt/Whisper.mm +0 -68
- package/ios/RnExecutorch/models/stt/WhisperDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/WhisperDecoder.mm +0 -22
- package/ios/RnExecutorch/models/stt/WhisperEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/WhisperEncoder.mm +0 -21
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.h +0 -11
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.mm +0 -50
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.h +0 -15
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.mm +0 -45
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.h +0 -8
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.mm +0 -49
- package/ios/RnExecutorch/utils/Constants.h +0 -8
- package/ios/RnExecutorch/utils/Conversions.h +0 -15
- package/ios/RnExecutorch/utils/ETError.h +0 -26
- package/ios/RnExecutorch/utils/ImageProcessor.h +0 -15
- package/ios/RnExecutorch/utils/ImageProcessor.mm +0 -147
- package/ios/RnExecutorch/utils/Numerical.h +0 -1
- package/ios/RnExecutorch/utils/Numerical.mm +0 -18
- package/ios/RnExecutorch/utils/ObjectDetectionUtils.hpp +0 -23
- package/ios/RnExecutorch/utils/SFFT.hpp +0 -13
- package/ios/RnExecutorch/utils/SFFT.mm +0 -71
- package/ios/RnExecutorch/utils/ScalarType.h +0 -14
- package/ios/RnExecutorch/utils/ScalarType.mm +0 -21
- package/lib/module/constants/sttDefaults.js +0 -72
- package/lib/module/constants/sttDefaults.js.map +0 -1
- package/lib/module/controllers/SpeechToTextController.js +0 -307
- package/lib/module/controllers/SpeechToTextController.js.map +0 -1
- package/lib/module/native/NativeClassification.js +0 -5
- package/lib/module/native/NativeClassification.js.map +0 -1
- package/lib/module/native/NativeETModule.js +0 -5
- package/lib/module/native/NativeETModule.js.map +0 -1
- package/lib/module/native/NativeImageSegmentation.js +0 -5
- package/lib/module/native/NativeImageSegmentation.js.map +0 -1
- package/lib/module/native/NativeLLM.js +0 -5
- package/lib/module/native/NativeLLM.js.map +0 -1
- package/lib/module/native/NativeOCR.js +0 -5
- package/lib/module/native/NativeOCR.js.map +0 -1
- package/lib/module/native/NativeObjectDetection.js +0 -5
- package/lib/module/native/NativeObjectDetection.js.map +0 -1
- package/lib/module/native/NativeSpeechToText.js +0 -5
- package/lib/module/native/NativeSpeechToText.js.map +0 -1
- package/lib/module/native/NativeStyleTransfer.js +0 -5
- package/lib/module/native/NativeStyleTransfer.js.map +0 -1
- package/lib/module/native/NativeTextEmbeddings.js +0 -5
- package/lib/module/native/NativeTextEmbeddings.js.map +0 -1
- package/lib/module/native/NativeTokenizer.js +0 -5
- package/lib/module/native/NativeTokenizer.js.map +0 -1
- package/lib/module/native/NativeVerticalOCR.js +0 -5
- package/lib/module/native/NativeVerticalOCR.js.map +0 -1
- package/lib/module/package.json +0 -1
- package/lib/module/utils/stt.js +0 -22
- package/lib/module/utils/stt.js.map +0 -1
- package/lib/typescript/constants/sttDefaults.d.ts +0 -28
- package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
- package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -52
- package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
- package/lib/typescript/native/NativeClassification.d.ts +0 -10
- package/lib/typescript/native/NativeClassification.d.ts.map +0 -1
- package/lib/typescript/native/NativeETModule.d.ts +0 -9
- package/lib/typescript/native/NativeETModule.d.ts.map +0 -1
- package/lib/typescript/native/NativeImageSegmentation.d.ts +0 -10
- package/lib/typescript/native/NativeImageSegmentation.d.ts.map +0 -1
- package/lib/typescript/native/NativeLLM.d.ts +0 -12
- package/lib/typescript/native/NativeLLM.d.ts.map +0 -1
- package/lib/typescript/native/NativeOCR.d.ts +0 -9
- package/lib/typescript/native/NativeOCR.d.ts.map +0 -1
- package/lib/typescript/native/NativeObjectDetection.d.ts +0 -9
- package/lib/typescript/native/NativeObjectDetection.d.ts.map +0 -1
- package/lib/typescript/native/NativeSpeechToText.d.ts +0 -12
- package/lib/typescript/native/NativeSpeechToText.d.ts.map +0 -1
- package/lib/typescript/native/NativeStyleTransfer.d.ts.map +0 -1
- package/lib/typescript/native/NativeTextEmbeddings.d.ts +0 -8
- package/lib/typescript/native/NativeTextEmbeddings.d.ts.map +0 -1
- package/lib/typescript/native/NativeTokenizer.d.ts +0 -12
- package/lib/typescript/native/NativeTokenizer.d.ts.map +0 -1
- package/lib/typescript/native/NativeVerticalOCR.d.ts +0 -9
- package/lib/typescript/native/NativeVerticalOCR.d.ts.map +0 -1
- package/lib/typescript/utils/stt.d.ts +0 -2
- package/lib/typescript/utils/stt.d.ts.map +0 -1
- package/src/constants/sttDefaults.ts +0 -86
- package/src/controllers/SpeechToTextController.ts +0 -458
- package/src/index.tsx +0 -47
- package/src/native/NativeClassification.ts +0 -9
- package/src/native/NativeETModule.ts +0 -14
- package/src/native/NativeImageSegmentation.ts +0 -14
- package/src/native/NativeLLM.ts +0 -14
- package/src/native/NativeOCR.ts +0 -16
- package/src/native/NativeObjectDetection.ts +0 -10
- package/src/native/NativeSpeechToText.ts +0 -17
- package/src/native/NativeStyleTransfer.ts +0 -10
- package/src/native/NativeTextEmbeddings.ts +0 -9
- package/src/native/NativeTokenizer.ts +0 -13
- package/src/native/NativeVerticalOCR.ts +0 -16
- package/src/utils/stt.ts +0 -28
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/Info.plist +4 -4
|
@@ -1,68 +0,0 @@
|
|
|
1
|
-
#import "Whisper.hpp"
#import "WhisperEncoder.hpp"
#import "WhisperDecoder.hpp"

/**
 * Whisper speech-to-text model.
 *
 * Owns a WhisperEncoder and a WhisperDecoder and caches the output of the
 * most recent -encode: call so that -decode:encoderLastHiddenState: can fall
 * back to it when the caller does not supply a hidden state.
 */
@implementation Whisper {
  WhisperEncoder *encoder;
  WhisperDecoder *decoder;
  NSNumber *START_TOKEN;
  NSNumber *EOS_TOKEN;
  // Result of the last -encode: call; used as the fallback decoder input.
  NSArray *encoderLastHiddenState;
  int maxSeqLen;
}

/**
 * Initializes the token constants and the maximum sequence length.
 * The encoder and decoder are not created here; see -loadModules:.
 */
- (instancetype)init {
  self = [super init];
  if (self) {
    START_TOKEN = @50257;
    EOS_TOKEN = @50256;
    maxSeqLen = 512;
  }
  return self;
}

/**
 * Runs the encoder on the waveform and caches its output.
 *
 * @param waveform Input forwarded unchanged to the encoder.
 * @return The encoder output (also stored in encoderLastHiddenState).
 * @throws NSException named "forward_error" when the encoder returns nil.
 */
- (NSArray *)encode:(NSArray *)waveform {
  self->encoderLastHiddenState = [self->encoder encode:waveform];

  if (!self->encoderLastHiddenState) {
    // +raise:format: takes a format string; supply one so the exception
    // carries a usable reason instead of a nil format.
    [NSException raise:@"forward_error"
                format:@"Whisper encoder returned no hidden state"];
  }
  return self->encoderLastHiddenState;
}

/**
 * Runs the decoder for the given previously generated tokens.
 *
 * @param prevTokens Tokens forwarded to the decoder.
 * @param encoderLastHiddenState Hidden state to decode against. When it is
 *        nil or empty, the output cached by the last -encode: call is used
 *        instead, wrapped in a single-element array.
 * @return Whatever the decoder returns for these inputs.
 */
- (NSArray *)decode:(NSArray *)prevTokens
    encoderLastHiddenState:(NSArray *)encoderLastHiddenState {
  if ([encoderLastHiddenState count] > 0) {
    return [self->decoder decode:prevTokens
          encoderLastHiddenState:encoderLastHiddenState];
  }
  // No hidden state supplied: fall back to the cached encoder output.
  return [self->decoder
                      decode:prevTokens
      encoderLastHiddenState:[NSMutableArray
                                 arrayWithObject:self->encoderLastHiddenState]];
}

/**
 * Creates the encoder and decoder and loads them one after the other.
 *
 * @param modelSources Index 0 is the encoder source, index 1 the decoder
 *        source.
 * @throws NSException named "init_encoder_error" or "init_decoder_error",
 *         with the reported error code as the reason, when the matching
 *         load fails.
 */
- (void)loadModules:(NSArray *)modelSources {

  self->encoder = [[WhisperEncoder alloc] init];
  self->decoder = [[WhisperDecoder alloc] init];

  // Load the encoder first
  [self loadModuleHelper:self->encoder
      withSource:[modelSources objectAtIndex:0]
      onSuccess:^{
        // Load decoder after encoder
        [self loadModuleHelper:self->decoder
            withSource:[modelSources objectAtIndex:1]
            onSuccess:^{
            }
            onFailure:^(NSString *errorCode) {
              // errorCode is an NSString, so it must be formatted with %@.
              [NSException raise:@"init_decoder_error" format:@"%@", errorCode];
            }];
      }
      onFailure:^(NSString *errorCode) {
        // errorCode is an NSString, so it must be formatted with %@.
        [NSException raise:@"init_encoder_error" format:@"%@", errorCode];
      }];
}

@end
|
|
@@ -1,16 +0,0 @@
|
|
|
1
|
-
#ifndef WhisperDecoder_hpp
|
|
2
|
-
#define WhisperDecoder_hpp
|
|
3
|
-
|
|
4
|
-
#import "../BaseModel.h"
|
|
5
|
-
#import "ExecutorchLib/ETModel.h"
|
|
6
|
-
#import <Foundation/Foundation.h>
|
|
7
|
-
#import <UIKit/UIKit.h>
|
|
8
|
-
|
|
9
|
-
/// Decoder model wrapper built on BaseModel.
@interface WhisperDecoder : BaseModel

/// Runs a forward pass over the previously generated tokens together with the
/// encoder hidden state and returns the decoder's prediction.
///
/// @param prevTokens Tokens generated so far.
/// @param encoderLastHiddenState Encoder output to condition the decoder on.
- (NSArray *)decode:(NSArray *)prevTokens
    encoderLastHiddenState:(NSArray *)encoderLastHiddenState;

@end
|
|
15
|
-
|
|
16
|
-
#endif /* WhisperDecoder_hpp */
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
#import "WhisperDecoder.hpp"
|
|
2
|
-
#import "../../utils/ScalarType.h"
|
|
3
|
-
|
|
4
|
-
// Element types handed to -forward:shapes:inputTypes:, in input order:
// the token ids first, the encoder hidden state second.
NSNumber *encoderLastHiddenStateType = ScalarType.Float;
NSNumber *prevTokensType = ScalarType.Int32;
NSArray *decoderInputTypes = @[ prevTokensType, encoderLastHiddenStateType ];
// Fixed shape declared for the encoder hidden state input.
NSArray *encoderLastHiddenStateShape = @[ @1, @1500, @384 ];

@implementation WhisperDecoder

/// Feeds `prevTokens` (declared as shape [1, token count]) and the encoder
/// hidden state to the model and returns the last element of the first
/// output.
- (NSArray *)decode:(NSArray *)prevTokens
    encoderLastHiddenState:(NSArray *)encoderLastHiddenState {
  NSArray *tokenShape = @[ @1, @([prevTokens count]) ];
  NSArray *modelInputs = @[ prevTokens, encoderLastHiddenState ];
  NSArray *modelShapes = @[ tokenShape, encoderLastHiddenStateShape ];

  NSArray *outputs = [self forward:modelInputs
                            shapes:modelShapes
                        inputTypes:decoderInputTypes];
  return [outputs[0] lastObject];
}

@end
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
#ifndef WhisperEncoder_hpp
|
|
2
|
-
#define WhisperEncoder_hpp
|
|
3
|
-
|
|
4
|
-
#import "../BaseModel.h"
|
|
5
|
-
#import "ExecutorchLib/ETModel.h"
|
|
6
|
-
#import <Foundation/Foundation.h>
|
|
7
|
-
#import <UIKit/UIKit.h>
|
|
8
|
-
|
|
9
|
-
/// Encoder model wrapper built on BaseModel.
@interface WhisperEncoder : BaseModel

/// Encodes an audio waveform and returns the encoder output.
///
/// @param waveform Audio samples to encode.
- (NSArray *)encode:(NSArray *)waveform;

@end
|
|
14
|
-
|
|
15
|
-
#endif /* WhisperEncoder_hpp */
|
|
@@ -1,21 +0,0 @@
|
|
|
1
|
-
#import "WhisperEncoder.hpp"
|
|
2
|
-
#import "../../utils/SFFT.hpp"
|
|
3
|
-
#import "../../utils/ScalarType.h"
|
|
4
|
-
|
|
5
|
-
// Element type of the single spectrogram input.
NSArray *spectrogramInputType = [NSArray arrayWithObject:ScalarType.Float];
// Number of values per spectrogram frame.
NSNumber *fftFrameSize = @256;

@implementation WhisperEncoder

/// Converts `waveform` to a spectrogram (FFT size 512, hop length 160) and
/// runs the model on it, returning the model's first output.
- (NSArray *)encode:(NSArray *)waveform {
  NSArray *spectrogram = [SFFT sfftFromWaveform:waveform
                                        fftSize:512
                                   fftHopLength:160];

  // The spectrogram is a flat array holding 256 values per frame.
  NSNumber *frameCount = @((double)([spectrogram count] / 256));
  NSArray *shapes = @[ @[ frameCount, fftFrameSize ] ];

  NSArray *outputs = [self forward:@[ spectrogram ]
                            shapes:shapes
                        inputTypes:spectrogramInputType];
  // forward returns an array of outputs; only the first one is needed.
  return outputs[0];
}

@end
|
|
@@ -1,11 +0,0 @@
|
|
|
1
|
-
#import "../BaseModel.h"
|
|
2
|
-
#import "opencv2/opencv.hpp"
|
|
3
|
-
|
|
4
|
-
/// Image-to-image model wrapper built on BaseModel.
@interface StyleTransferModel : BaseModel

/// Image size expected by the model, read from the shape of model input 0.
- (cv::Size)getModelImageSize;

/// Resizes `input` to the model image size and converts it to a model input
/// array.
- (NSArray *)preprocess:(cv::Mat &)input;

/// Converts a model output array back to an image and resizes it to the size
/// of the last preprocessed input.
- (cv::Mat)postprocess:(NSArray *)output;

/// Runs preprocess, the model and postprocess. The result is also written
/// back into `input`.
- (cv::Mat)runModel:(cv::Mat &)input;

@end
|
|
@@ -1,50 +0,0 @@
|
|
|
1
|
-
#import "StyleTransferModel.h"
|
|
2
|
-
#import "../../utils/ImageProcessor.h"
|
|
3
|
-
|
|
4
|
-
@implementation StyleTransferModel {
  // Size (width x height) of the image most recently passed to -preprocess:.
  cv::Size originalSize;
}

/// Returns the image size expected by the model.
///
/// The last two entries of the shape of model input 0 are read as height and
/// width, in that order.
- (cv::Size)getModelImageSize {
  NSArray *inputShape = [module getInputShape:@0];
  NSNumber *widthNumber = inputShape.lastObject;
  NSNumber *heightNumber = inputShape[inputShape.count - 2];

  int height = [heightNumber intValue];
  int width = [widthNumber intValue];

  // cv::Size takes (width, height); passing them the other way round only
  // happens to work for square model inputs.
  return cv::Size(width, height);
}

/// Remembers the size of `input`, resizes it to the model image size and
/// converts it to the array layout produced by ImageProcessor.
- (NSArray *)preprocess:(cv::Mat &)input {
  self->originalSize = cv::Size(input.cols, input.rows);

  cv::Size modelImageSize = [self getModelImageSize];
  cv::Mat output;
  cv::resize(input, output, modelImageSize);

  NSArray *modelInput = [ImageProcessor matToNSArray:output];
  return modelInput;
}

/// Rebuilds an image from the model output and scales it back to the size of
/// the image last seen by -preprocess:.
- (cv::Mat)postprocess:(NSArray *)output {
  cv::Size modelImageSize = [self getModelImageSize];
  cv::Mat processedImage = [ImageProcessor arrayToMat:output
                                                width:modelImageSize.width
                                               height:modelImageSize.height];

  cv::Mat processedOutput;
  cv::resize(processedImage, processedOutput, originalSize);

  return processedOutput;
}

/// Runs the full pipeline on `input`. The result replaces the contents of
/// `input` and is also returned.
- (cv::Mat)runModel:(cv::Mat &)input {
  NSArray *modelInput = [self preprocess:input];
  NSArray *result = [self forward:@[ modelInput ]];
  input = [self postprocess:result[0]];

  return input;
}

@end
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
#import "BaseModel.h"
|
|
2
|
-
#import "ExecutorchLib/HuggingFaceTokenizer.h"
|
|
3
|
-
|
|
4
|
-
/// Text embedding model wrapper built on BaseModel.
@interface TextEmbeddingsModel : BaseModel {
@protected
  // Tokenizer created by -loadTokenizer:.
  HuggingFaceTokenizer *tokenizer;
}

/// Creates the tokenizer from the given tokenizer path.
- (void)loadTokenizer:(NSString *)tokenizerSource;

/// Tokenizes `input` and returns the token ids with their attention mask.
- (NSArray *)preprocess:(NSString *)input;

/// Computes the embedding of `input`.
- (NSArray *)runModel:(NSString *)input;

/// Pools the raw model output with the attention mask and normalizes it.
- (NSArray *)postprocess:(NSArray *)input
           attentionMask:(NSArray *)attentionMask;

@end
|
|
@@ -1,45 +0,0 @@
|
|
|
1
|
-
#import "TextEmbeddingsModel.h"
|
|
2
|
-
#import "TextEmbeddingsUtils.h"
|
|
3
|
-
|
|
4
|
-
@implementation TextEmbeddingsModel

/// Tokenizes `input` and returns `@[ tokenIds, attentionMask ]`.
/// The mask holds 1 for every token id different from 0 and 0 otherwise.
- (NSArray *)preprocess:(NSString *)input {
  NSArray *tokenIds = [self->tokenizer encode:input];
  NSMutableArray *mask = [NSMutableArray new];
  for (NSUInteger index = 0; index < [tokenIds count]; index++) {
    int isRealToken = ([tokenIds[index] intValue] != 0) ? 1 : 0;
    [mask addObject:@(isRealToken)];
  }
  return @[ tokenIds, mask ]; // [2, tokens]
}

/// Mean-pools the flat model output with the attention mask and normalizes
/// the pooled vector.
- (NSArray *)postprocess:(NSArray *)modelOutput // [tokens * embedding_dim]
           attentionMask:(NSArray *)attentionMask // [tokens]
{
  NSArray *pooled = [TextEmbeddingsUtils meanPooling:modelOutput
                                       attentionMask:attentionMask];
  return [TextEmbeddingsUtils normalize:pooled];
}

/// Tokenizes `input`, runs the model on the token ids and attention mask
/// (each declared with shape [1, tokens]) and post-processes the first
/// output.
- (NSArray *)runModel:(NSString *)input {
  NSArray *modelInput = [self preprocess:input];

  // Both inputs use type code 4.
  // NOTE(review): presumably the 64-bit integer scalar type - confirm against
  // ScalarType.
  NSMutableArray *inputTypes = [NSMutableArray arrayWithObjects:@4, @4, nil];

  // One [1, tokens] shape per model input.
  NSNumber *tokenCount = @([modelInput[0] count]);
  NSMutableArray *shapes = [NSMutableArray new];
  for (NSUInteger index = 0; index < [modelInput count]; index++) {
    [shapes addObject:[NSMutableArray arrayWithObjects:@1, tokenCount, nil]];
  }

  NSArray *modelOutput = [self forward:modelInput
                                shapes:shapes
                            inputTypes:inputTypes];
  return [self postprocess:modelOutput[0] attentionMask:modelInput[1]];
}

/// Creates the tokenizer from the file at `tokenizerSource`.
- (void)loadTokenizer:(NSString *)tokenizerSource {
  tokenizer =
      [[HuggingFaceTokenizer alloc] initWithTokenizerPath:tokenizerSource];
}

@end
|
|
@@ -1,49 +0,0 @@
|
|
|
1
|
-
#import "TextEmbeddingsUtils.h"
|
|
2
|
-
|
|
3
|
-
@implementation TextEmbeddingsUtils

/// Attention-weighted mean over the token axis.
///
/// `modelOutput` is read as a flat, token-major array of
/// `attentionMask.count * embeddingDim` values. The result has `embeddingDim`
/// entries; entry i is the sum over tokens of value * mask, divided by the
/// sum of the mask (at least 1e-9). An empty mask yields an empty result.
+ (NSArray *)meanPooling:(NSArray *)modelOutput
           attentionMask:(NSArray *)attentionMask {
  NSInteger modelOutputLength = [modelOutput count];
  NSInteger attentionMaskLength = [attentionMask count];

  // Without tokens there is nothing to pool, and the division below would
  // divide by zero.
  if (attentionMaskLength == 0) {
    return [NSMutableArray array];
  }
  NSInteger embeddingDim = modelOutputLength / attentionMaskLength;

  NSMutableArray *result = [NSMutableArray arrayWithCapacity:embeddingDim];

  double sumMask = 0.0;
  for (NSNumber *maskValue in attentionMask) {
    sumMask += [maskValue intValue];
  }
  // Keeps the division finite when every token is masked out.
  sumMask = fmax(sumMask, 1e-9);

  for (NSInteger i = 0; i < embeddingDim; i++) {
    double sum = 0;
    for (NSInteger j = 0; j < attentionMaskLength; j++) {
      sum += [modelOutput[j * embeddingDim + i] doubleValue] *
             [attentionMask[j] intValue];
    }
    [result addObject:@(sum / sumMask)];
  }

  return result;
}

/// Scales `embeddings` to unit Euclidean length. The norm is floored at 1e-9
/// so an all-zero vector stays all-zero instead of producing NaN.
+ (NSArray *)normalize:(NSArray *)embeddings {
  NSInteger embeddingDim = [embeddings count];
  double sum = 0.0;

  for (NSNumber *value in embeddings) {
    sum += [value doubleValue] * [value doubleValue];
  }
  sum = fmax(sqrt(sum), 1e-9);

  NSMutableArray *normalizedResult =
      [NSMutableArray arrayWithCapacity:embeddingDim];
  for (NSNumber *value in embeddings) {
    [normalizedResult addObject:@([value doubleValue] / sum)];
  }

  return normalizedResult;
}

@end
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
#import "opencv2/opencv.hpp"
|
|
2
|
-
|
|
3
|
-
// Flattens a matrix that stores one value of type T per cell into an NSArray
// of NSNumbers, row by row.
template <typename T>
NSArray *simpleMatToNSArray(const cv::Mat &mat) {
  std::size_t cellCount = mat.rows * mat.cols;
  NSMutableArray *values =
      [[NSMutableArray alloc] initWithCapacity:cellCount];

  for (std::size_t row = 0; row < mat.rows; ++row) {
    for (std::size_t col = 0; col < mat.cols; ++col) {
      // Cells are visited in row-major order, so appending puts each value at
      // index row * cols + col.
      [values addObject:@(mat.at<T>(row, col))];
    }
  }
  return values;
}
|
|
@@ -1,26 +0,0 @@
|
|
|
1
|
-
/// Error codes reported by the native modules, listed in ascending order.
/// NOTE(review): codes 0x00-0x32 look like they mirror the ExecuTorch runtime
/// error codes, with the remaining ones added by this library - confirm.
typedef NS_ENUM(NSUInteger, ETError) {
  // General status
  Ok = 0x00,
  Internal = 0x01,
  InvalidState = 0x02,
  EndOfMethod = 0x03,

  // Unsupported or invalid requests
  NotSupported = 0x10,
  NotImplemented = 0x11,
  InvalidArgument = 0x12,
  InvalidType = 0x13,
  OperatorMissing = 0x14,

  // Resources and program loading
  NotFound = 0x20,
  MemoryAllocationFailed = 0x21,
  AccessFailed = 0x22,
  InvalidProgram = 0x23,

  // Delegates
  DelegateInvalidCompatibility = 0x30,
  DelegateMemoryAllocationFailed = 0x31,
  DelegateInvalidHandle = 0x32,

  // Remaining codes
  UndefinedError = 0x65,
  ModuleNotLoaded = 0x66,
  FileWriteFailed = 0x67,
  InvalidModelSource = 0xff
};
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
#import <opencv2/opencv.hpp>
|
|
2
|
-
|
|
3
|
-
/// Conversions between OpenCV matrices and flat NSArrays, plus image loading
/// and saving helpers.
@interface ImageProcessor : NSObject

/// Converts a 3-channel 8-bit image to a planar array (all values of channel
/// 0, then channel 1, then channel 2), computing
/// (pixel - mean * 255) / (variance * 255) per channel.
+ (NSArray *)matToNSArray:(const cv::Mat &)mat
                     mean:(cv::Scalar)mean
                 variance:(cv::Scalar)variance;

/// Same as above with mean 0 and variance 1, i.e. pixel / 255.
+ (NSArray *)matToNSArray:(const cv::Mat &)mat;

/// Builds an 8-bit 3-channel image from a planar array of values scaled by
/// 255.
+ (cv::Mat)arrayToMat:(NSArray *)array width:(int)width height:(int)height;

/// Builds a single-channel float image from a flat row-major array.
+ (cv::Mat)arrayToMatGray:(NSArray *)array width:(int)width height:(int)height;

/// Flattens a single-channel float image to a row-major array.
+ (NSArray *)matToNSArrayGray:(const cv::Mat &)mat;

/// Writes the image as a PNG into the temporary directory and returns its
/// file:// URL string.
+ (NSString *)saveToTempFile:(const cv::Mat &)image;

/// Loads an image from a data: URI, a file: URL or any other URL.
+ (cv::Mat)readImage:(NSString *)source;

@end
|
|
@@ -1,147 +0,0 @@
|
|
|
1
|
-
#import "ImageProcessor.h"
|
|
2
|
-
#import "ETError.h"
|
|
3
|
-
|
|
4
|
-
// Scales a channel value by 255 and converts it to an 8-bit intensity.
// The product is clamped to [0, 255] first, because casting an out-of-range
// float to uchar is undefined; in-range values are truncated as before.
static inline uchar RNEChannelToByte(float value) {
  return (uchar)fminf(fmaxf(value * 255, 0.0f), 255.0f);
}

@implementation ImageProcessor

/// Converts `mat` with mean 0 and variance 1, i.e. every value becomes
/// pixel / 255.
+ (NSArray *)matToNSArray:(const cv::Mat &)mat {
  return [ImageProcessor matToNSArray:mat
                                 mean:cv::Scalar(0.0, 0.0, 0.0)
                             variance:cv::Scalar(1.0, 1.0, 1.0)];
}

/// Converts a 3-channel 8-bit image to a planar array: all values of channel
/// 0 first, then channel 1, then channel 2, each in row-major order.
///
/// Every value is (pixel - mean * 255) / (variance * 255); `variance` is used
/// as the divisor exactly as given (no square root is taken).
+ (NSArray *)matToNSArray:(const cv::Mat &)mat
                     mean:(cv::Scalar)mean
                 variance:(cv::Scalar)variance {
  int pixelCount = mat.cols * mat.rows;
  NSMutableArray *floatArray =
      [[NSMutableArray alloc] initWithCapacity:pixelCount * 3];

  // Appending channel by channel yields the planar layout directly, so no
  // placeholder pre-fill is needed.
  for (int channel = 0; channel < 3; channel++) {
    for (int i = 0; i < pixelCount; i++) {
      int row = i / mat.cols;
      int col = i % mat.cols;
      const cv::Vec3b &pixel = mat.at<cv::Vec3b>(row, col);
      [floatArray addObject:@((pixel[channel] - mean[channel] * 255.0) /
                              (variance[channel] * 255.0))];
    }
  }

  return floatArray;
}

/// Flattens a single-channel float image to a row-major array.
+ (NSArray *)matToNSArrayGray:(const cv::Mat &)mat {
  NSMutableArray *pixelArray =
      [[NSMutableArray alloc] initWithCapacity:mat.cols * mat.rows];

  for (int row = 0; row < mat.rows; row++) {
    for (int col = 0; col < mat.cols; col++) {
      float pixelValue = mat.at<float>(row, col);
      [pixelArray addObject:@(pixelValue)];
    }
  }

  return pixelArray;
}

/// Builds an 8-bit 3-channel image from a planar array of
/// 3 * width * height values.
///
/// The three planes are read as r, g, b and stored in each pixel in the order
/// (b, g, r). Values are scaled by 255 and clamped to [0, 255].
+ (cv::Mat)arrayToMat:(NSArray *)array width:(int)width height:(int)height {
  cv::Mat mat(height, width, CV_8UC3);

  int pixelCount = width * height;
  for (int i = 0; i < pixelCount; i++) {
    int row = i / width;
    int col = i % width;

    float r = [[array objectAtIndex:0 * pixelCount + i] floatValue];
    float g = [[array objectAtIndex:1 * pixelCount + i] floatValue];
    float b = [[array objectAtIndex:2 * pixelCount + i] floatValue];

    mat.at<cv::Vec3b>(row, col) = cv::Vec3b(
        RNEChannelToByte(b), RNEChannelToByte(g), RNEChannelToByte(r));
  }

  return mat;
}

/// Builds a single-channel float image from a flat row-major array of
/// width * height values.
+ (cv::Mat)arrayToMatGray:(NSArray *)array width:(int)width height:(int)height {
  cv::Mat mat(height, width, CV_32F);

  int pixelCount = width * height;
  for (int i = 0; i < pixelCount; i++) {
    int row = i / width;
    int col = i % width;
    float value = [array[i] floatValue];
    mat.at<float>(row, col) = value;
  }

  return mat;
}

/// Writes `image` as a uniquely named PNG into the temporary directory and
/// returns its location as a file:// string.
/// Throws "ImageSaveException" (reason: FileWriteFailed code) when the write
/// fails.
+ (NSString *)saveToTempFile:(const cv::Mat &)image {
  NSString *uniqueID = [[NSUUID UUID] UUIDString];
  NSString *filename =
      [NSString stringWithFormat:@"rn_executorch_%@.png", uniqueID];
  NSString *outputPath =
      [NSTemporaryDirectory() stringByAppendingPathComponent:filename];

  std::string filePath = [outputPath UTF8String];
  if (!cv::imwrite(filePath, image)) {
    @throw [NSException
        exceptionWithName:@"ImageSaveException"
                   reason:[NSString
                              stringWithFormat:@"%ld", (long)FileWriteFailed]
                 userInfo:nil];
  }

  return [NSString stringWithFormat:@"file://%@", outputPath];
}

/// Decodes an encoded image held in `data`.
/// Returns an empty matrix for nil or zero-length data instead of handing an
/// empty buffer to cv::imdecode, which rejects it with a C++ exception.
+ (cv::Mat)decodeImageData:(NSData *)data {
  if ([data length] == 0) {
    return cv::Mat();
  }
  cv::Mat encodedData(1, (int)[data length], CV_8UC1, (void *)data.bytes);
  return cv::imdecode(encodedData, cv::IMREAD_COLOR);
}

/// Loads a colour image from `source`, which may be a base64 data: URI, a
/// file: URL, or any other URL (fetched synchronously).
/// Throws "readImage_error" (reason: InvalidArgument code) when the source is
/// malformed or no image could be decoded from it.
+ (cv::Mat)readImage:(NSString *)source {
  NSURL *url = [NSURL URLWithString:source];

  cv::Mat inputImage;
  if ([[url scheme] isEqualToString:@"data"]) {
    // base64
    NSArray *parts = [source componentsSeparatedByString:@","];
    if ([parts count] < 2) {
      @throw [NSException
          exceptionWithName:@"readImage_error"
                     reason:[NSString
                                stringWithFormat:@"%ld", (long)InvalidArgument]
                   userInfo:nil];
    }
    NSString *encodedString = parts[1];
    NSData *data = [[NSData alloc]
        initWithBase64EncodedString:encodedString
                            options:
                                NSDataBase64DecodingIgnoreUnknownCharacters];
    inputImage = [ImageProcessor decodeImageData:data];
  } else if ([[url scheme] isEqualToString:@"file"]) {
    // local file
    inputImage = cv::imread([[url path] UTF8String], cv::IMREAD_COLOR);
  } else {
    // external file
    NSData *data = [NSData dataWithContentsOfURL:url];
    inputImage = [ImageProcessor decodeImageData:data];
  }

  // Covers undecodable data as well as missing or empty input.
  if (inputImage.empty()) {
    @throw [NSException
        exceptionWithName:@"readImage_error"
                   reason:[NSString
                              stringWithFormat:@"%ld", (long)InvalidArgument]
                 userInfo:nil];
  }

  return inputImage;
}

@end
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
#pragma once

#include <vector>

/// Returns the softmax of `v`: exp(v[i]) divided by the sum of exp over all
/// elements, as a vector of the same length as `v`.
std::vector<double> softmax(const std::vector<double> &v);
|
|
@@ -1,18 +0,0 @@
|
|
|
1
|
-
#include "Utils.h"
|
|
2
|
-
|
|
3
|
-
/// Numerically stable softmax.
///
/// The maximum element is subtracted before exponentiating so large inputs do
/// not overflow. Returns a vector of the same length as `v`; an empty input
/// yields an empty result.
std::vector<double> softmax(const std::vector<double> &v) {
  std::vector<double> result(v.size());
  // max_element returns end() for an empty range, which must not be
  // dereferenced.
  if (v.empty()) {
    return result;
  }

  const double maxVal = *std::max_element(v.begin(), v.end());

  double sumExp = 0.0;
  for (size_t i = 0; i < v.size(); ++i) {
    result[i] = std::exp(v[i] - maxVal);
    sumExp += result[i];
  }

  // sumExp is at least 1 because the maximum element contributes exp(0).
  for (size_t i = 0; i < v.size(); ++i) {
    result[i] /= sumExp;
  }

  return result;
}
|
|
@@ -1,23 +0,0 @@
|
|
|
1
|
-
#ifndef ObjectDetectionUtils_hpp
|
|
2
|
-
#define ObjectDetectionUtils_hpp
|
|
3
|
-
|
|
4
|
-
#import <Foundation/Foundation.h>
|
|
5
|
-
#include <stdio.h>
|
|
6
|
-
#include <vector>
|
|
7
|
-
|
|
8
|
-
// One detected object: a box given by two corner points, plus a label and a
// score, all stored as floats.
// NOTE(review): presumably (x1, y1) and (x2, y2) are opposite box corners -
// confirm against the implementation.
struct Detection {
  float x1, y1;
  float x2, y2;
  float label;
  float score;
};

// Converts a label stored as a float to its string form.
NSString *floatLabelToNSString(float label);

// Converts a detection to a dictionary.
NSDictionary *detectionToNSDictionary(const Detection &detection);

// Intersection-over-union of two detections.
float iou(const Detection &a, const Detection &b);

// Non-maximum suppression over `detections` using `iouThreshold`.
std::vector<Detection> nms(std::vector<Detection> detections,
                           float iouThreshold);
|
|
22
|
-
|
|
23
|
-
#endif /* ObjectDetectionUtils_hpp */
|
|
@@ -1,13 +0,0 @@
|
|
|
1
|
-
#import <Accelerate/Accelerate.h>
|
|
2
|
-
#import <UIKit/UIKit.h>
|
|
3
|
-
|
|
4
|
-
/// Short-time Fourier transform helpers built on Accelerate (vDSP).
@interface SFFT : NSObject

/// Splits `waveform` into frames of `fftSize` samples taken every
/// `fftHopLength` samples and returns the magnitudes (in dB) of all frames as
/// one flat array with `fftSize / 2` values per frame.
+ (NSArray *)sfftFromWaveform:(NSArray *)waveform
                      fftSize:(int)fftSize
                 fftHopLength:(int)fftHopLength;

/// Transforms one frame of `fftSize` samples and appends its `fftSize / 2`
/// magnitudes (in dB) to `magnitudes`.
///
/// The keyword order matches the selector the class actually implements
/// (fft:fftSetup:magnitudes:fftSize:).
+ (void)fft:(float *)signal
      fftSetup:(FFTSetup)fftSetup
    magnitudes:(NSMutableArray *)magnitudes
       fftSize:(int)fftSize;
@end
|
|
@@ -1,71 +0,0 @@
|
|
|
1
|
-
#import "SFFT.hpp"
|
|
2
|
-
|
|
3
|
-
@implementation SFFT

/// Computes a magnitude spectrogram of `waveform`.
///
/// Frames of `fftSize` samples are taken every `fftHopLength` samples,
/// multiplied by a Hann window and transformed. The result is one flat array
/// holding `fftSize / 2` magnitudes (in dB) per frame, frame after frame.
/// Trailing samples that do not fill a whole frame are ignored.
///
/// Returns an empty array when `fftSize` is below 2, `fftHopLength` is not
/// positive, or the FFT setup cannot be created.
+ (NSArray *)sfftFromWaveform:(NSArray *)waveform
                      fftSize:(int)fftSize
                 fftHopLength:(int)fftHopLength {
  NSMutableArray *stftResult = [NSMutableArray new];

  // A frame needs at least two samples (the window divides by fftSize - 1 and
  // the transform writes fftSize / 2 bins), and a non-positive hop would never
  // advance through the waveform.
  if (fftSize < 2 || fftHopLength <= 0) {
    return stftResult;
  }

  FFTSetup fftSetup = vDSP_create_fftsetup(log2(fftSize), kFFTRadix2);
  if (!fftSetup) {
    NSLog(@"Error creating FFT setup.");
    // The transform cannot run without a setup object.
    return stftResult;
  }

  // Generate Hann Window coefficients.
  // https://www.mathworks.com/help/signal/ref/hann.html
  float hann[fftSize];
  for (int i = 0; i < fftSize; i++) {
    hann[i] = 0.5 * (1 - cos(2 * M_PI * i / (fftSize - 1)));
  }

  const NSUInteger sampleCount = waveform.count;
  for (NSUInteger frameStart = 0; frameStart + fftSize <= sampleCount;
       frameStart += fftHopLength) {
    float signal[fftSize];

    // Extract the frame and apply the Hann window.
    for (int i = 0; i < fftSize; i++) {
      signal[i] = [waveform[frameStart + i] floatValue] * hann[i];
    }

    [SFFT fft:signal fftSetup:fftSetup magnitudes:stftResult fftSize:fftSize];
  }

  vDSP_destroy_fftsetup(fftSetup);
  return stftResult;
}

/// Transforms one frame of `fftSize` real samples and appends `fftSize / 2`
/// magnitudes, converted to dB, to `magnitudes`.
+ (void)fft:(float *)signal
      fftSetup:(FFTSetup)fftSetup
    magnitudes:(NSMutableArray *)magnitudes
       fftSize:(int)fftSize {
  const int log2n = log2(fftSize);
  DSPSplitComplex a;
  a.realp = (float *)malloc(fftSize / 2 * sizeof(float));
  a.imagp = (float *)malloc(fftSize / 2 * sizeof(float));

  // Pack the real samples into split-complex form and run the in-place real
  // FFT.
  vDSP_ctoz((DSPComplex *)signal, 2, &a, 1, fftSize / 2);
  vDSP_fft_zrip(fftSetup, &a, 1, log2n, FFT_FORWARD);

  // Zero out the Nyquist component, which the packed output stores in
  // imagp[0], so bin 0 only reflects the DC term.
  a.imagp[0] = 0.0f;

  const float magnitudeScale = 1.0f / fftSize;
  for (int i = 0; i < fftSize / 2; ++i) {
    double magnitude = sqrt(a.realp[i] * a.realp[i] + a.imagp[i] * a.imagp[i]) *
                       magnitudeScale;
    // FIXME: the dB conversion is not needed, but removing it also requires
    // removing the step in the preprocessing part that reverses it.
    double magnitudeDb = 20 * log10f(magnitude);
    [magnitudes addObject:@(magnitudeDb)];
  }

  // Cleanup
  free(a.realp);
  free(a.imagp);
}

@end
|