react-native-executorch 0.4.10 → 0.5.0-nightly-6f4dd53-20251211
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +77 -71
- package/android/CMakeLists.txt +29 -0
- package/android/build.gradle +76 -13
- package/android/libs/classes.jar +0 -0
- package/android/src/main/cpp/CMakeLists.txt +109 -0
- package/android/src/main/cpp/ETInstallerModule.cpp +76 -0
- package/android/src/main/cpp/ETInstallerModule.h +43 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/ETInstaller.kt +66 -0
- package/android/src/main/java/com/swmansion/rnexecutorch/RnExecutorchPackage.kt +6 -124
- package/common/ada/ada.cpp +17406 -0
- package/common/ada/ada.h +10274 -0
- package/common/pfft/pfft.c +2205 -0
- package/common/pfft/pfft.h +185 -0
- package/common/rnexecutorch/Log.h +489 -0
- package/common/rnexecutorch/RnExecutorchInstaller.cpp +113 -0
- package/common/rnexecutorch/RnExecutorchInstaller.h +87 -0
- package/common/rnexecutorch/TokenizerModule.cpp +52 -0
- package/common/rnexecutorch/TokenizerModule.h +29 -0
- package/common/rnexecutorch/data_processing/FFT.cpp +21 -0
- package/common/rnexecutorch/data_processing/FFT.h +23 -0
- package/common/rnexecutorch/data_processing/FileUtils.h +30 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.cpp +240 -0
- package/common/rnexecutorch/data_processing/ImageProcessing.h +55 -0
- package/common/rnexecutorch/data_processing/Numerical.cpp +111 -0
- package/common/rnexecutorch/data_processing/Numerical.h +77 -0
- package/common/rnexecutorch/data_processing/base64.cpp +110 -0
- package/common/rnexecutorch/data_processing/base64.h +46 -0
- package/common/rnexecutorch/data_processing/dsp.cpp +19 -0
- package/common/rnexecutorch/data_processing/dsp.h +12 -0
- package/common/rnexecutorch/data_processing/gzip.cpp +47 -0
- package/common/rnexecutorch/data_processing/gzip.h +7 -0
- package/common/rnexecutorch/host_objects/JSTensorViewIn.h +12 -0
- package/common/rnexecutorch/host_objects/JSTensorViewOut.h +22 -0
- package/common/rnexecutorch/host_objects/JsiConversions.h +418 -0
- package/common/rnexecutorch/host_objects/ModelHostObject.h +313 -0
- package/common/rnexecutorch/jsi/JsiHostObject.cpp +108 -0
- package/common/rnexecutorch/jsi/JsiHostObject.h +87 -0
- package/common/rnexecutorch/jsi/OwningArrayBuffer.h +57 -0
- package/common/rnexecutorch/jsi/Promise.cpp +20 -0
- package/common/rnexecutorch/jsi/Promise.h +69 -0
- package/common/rnexecutorch/jsi/RuntimeAwareCache.h +58 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.cpp +53 -0
- package/common/rnexecutorch/jsi/RuntimeLifecycleMonitor.h +35 -0
- package/common/rnexecutorch/metaprogramming/ConstructorHelpers.h +133 -0
- package/common/rnexecutorch/metaprogramming/FunctionHelpers.h +50 -0
- package/common/rnexecutorch/metaprogramming/TypeConcepts.h +37 -0
- package/common/rnexecutorch/models/BaseModel.cpp +183 -0
- package/common/rnexecutorch/models/BaseModel.h +61 -0
- package/common/rnexecutorch/models/classification/Classification.cpp +72 -0
- package/common/rnexecutorch/models/classification/Classification.h +31 -0
- package/{ios/RnExecutorch/models/classification/Constants.mm → common/rnexecutorch/models/classification/Constants.h} +7 -2
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.cpp +19 -0
- package/common/rnexecutorch/models/embeddings/BaseEmbeddings.h +17 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.cpp +45 -0
- package/common/rnexecutorch/models/embeddings/image/ImageEmbeddings.h +28 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.cpp +60 -0
- package/common/rnexecutorch/models/embeddings/text/TextEmbeddings.h +31 -0
- package/{ios/RnExecutorch/models/image_segmentation/Constants.mm → common/rnexecutorch/models/image_segmentation/Constants.h} +7 -2
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.cpp +168 -0
- package/common/rnexecutorch/models/image_segmentation/ImageSegmentation.h +50 -0
- package/common/rnexecutorch/models/llm/LLM.cpp +98 -0
- package/common/rnexecutorch/models/llm/LLM.h +38 -0
- package/{ios/RnExecutorch/utils/Constants.mm → common/rnexecutorch/models/object_detection/Constants.h} +9 -2
- package/common/rnexecutorch/models/object_detection/ObjectDetection.cpp +82 -0
- package/common/rnexecutorch/models/object_detection/ObjectDetection.h +37 -0
- package/common/rnexecutorch/models/object_detection/Types.h +13 -0
- package/{ios/RnExecutorch/utils/ObjectDetectionUtils.mm → common/rnexecutorch/models/object_detection/Utils.cpp} +17 -35
- package/common/rnexecutorch/models/object_detection/Utils.h +11 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.cpp +88 -0
- package/common/rnexecutorch/models/ocr/CTCLabelConverter.h +29 -0
- package/common/rnexecutorch/models/ocr/Constants.h +41 -0
- package/common/rnexecutorch/models/ocr/Detector.cpp +100 -0
- package/common/rnexecutorch/models/ocr/Detector.h +30 -0
- package/common/rnexecutorch/models/ocr/OCR.cpp +53 -0
- package/common/rnexecutorch/models/ocr/OCR.h +44 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.cpp +108 -0
- package/common/rnexecutorch/models/ocr/RecognitionHandler.h +42 -0
- package/common/rnexecutorch/models/ocr/Recognizer.cpp +80 -0
- package/common/rnexecutorch/models/ocr/Recognizer.h +36 -0
- package/common/rnexecutorch/models/ocr/Types.h +35 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.cpp +710 -0
- package/common/rnexecutorch/models/ocr/utils/DetectorUtils.h +81 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.cpp +159 -0
- package/common/rnexecutorch/models/ocr/utils/RecognitionHandlerUtils.h +72 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.cpp +204 -0
- package/common/rnexecutorch/models/ocr/utils/RecognizerUtils.h +71 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +125 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +57 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.cpp +303 -0
- package/common/rnexecutorch/models/speech_to_text/asr/ASR.h +61 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.cpp +82 -0
- package/common/rnexecutorch/models/speech_to_text/stream/HypothesisBuffer.h +25 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.cpp +99 -0
- package/common/rnexecutorch/models/speech_to_text/stream/OnlineASRProcessor.h +33 -0
- package/common/rnexecutorch/models/speech_to_text/types/DecodingOptions.h +15 -0
- package/common/rnexecutorch/models/speech_to_text/types/GenerationResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/ProcessResult.h +12 -0
- package/common/rnexecutorch/models/speech_to_text/types/Segment.h +14 -0
- package/common/rnexecutorch/models/speech_to_text/types/Word.h +13 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.cpp +55 -0
- package/common/rnexecutorch/models/style_transfer/StyleTransfer.h +35 -0
- package/common/rnexecutorch/models/text_to_image/Constants.h +9 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.cpp +32 -0
- package/common/rnexecutorch/models/text_to_image/Decoder.h +24 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.cpp +44 -0
- package/common/rnexecutorch/models/text_to_image/Encoder.h +32 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.cpp +152 -0
- package/common/rnexecutorch/models/text_to_image/Scheduler.h +41 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.cpp +141 -0
- package/common/rnexecutorch/models/text_to_image/TextToImage.h +64 -0
- package/common/rnexecutorch/models/text_to_image/UNet.cpp +38 -0
- package/common/rnexecutorch/models/text_to_image/UNet.h +28 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.cpp +93 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalDetector.h +49 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.cpp +180 -0
- package/common/rnexecutorch/models/vertical_ocr/VerticalOCR.h +85 -0
- package/common/rnexecutorch/models/voice_activity_detection/Constants.h +27 -0
- package/common/rnexecutorch/models/voice_activity_detection/Types.h +12 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.cpp +15 -0
- package/common/rnexecutorch/models/voice_activity_detection/Utils.h +13 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.cpp +160 -0
- package/common/rnexecutorch/models/voice_activity_detection/VoiceActivityDetection.h +36 -0
- package/common/rnexecutorch/tests/CMakeLists.txt +30 -0
- package/common/rnexecutorch/tests/LogTest.cpp +530 -0
- package/common/rnexecutorch/tests/NumericalTest.cpp +110 -0
- package/common/rnexecutorch/tests/README.md +37 -0
- package/common/rnexecutorch/threads/GlobalThreadPool.h +84 -0
- package/common/rnexecutorch/threads/HighPerformanceThreadPool.h +364 -0
- package/common/rnexecutorch/threads/utils/ThreadUtils.h +29 -0
- package/common/runner/arange_util.cpp +44 -0
- package/common/runner/arange_util.h +37 -0
- package/common/runner/constants.h +28 -0
- package/common/runner/io_manager.h +240 -0
- package/common/runner/irunner.h +119 -0
- package/common/runner/kernel_includes.h +23 -0
- package/common/runner/runner.cpp +369 -0
- package/common/runner/runner.h +85 -0
- package/common/runner/sampler.cpp +201 -0
- package/common/runner/sampler.h +67 -0
- package/common/runner/stats.h +161 -0
- package/common/runner/text_decoder_runner.cpp +79 -0
- package/common/runner/text_decoder_runner.h +126 -0
- package/common/runner/text_prefiller.cpp +125 -0
- package/common/runner/text_prefiller.h +85 -0
- package/common/runner/text_token_generator.h +205 -0
- package/common/runner/util.h +153 -0
- package/ios/RnExecutorch/ETInstaller.h +8 -0
- package/ios/RnExecutorch/ETInstaller.mm +56 -0
- package/ios/RnExecutorch.xcodeproj/project.pbxproj +73 -23
- package/lib/module/Error.js +3 -0
- package/lib/module/Error.js.map +1 -1
- package/lib/module/common/Logger.js +23 -0
- package/lib/module/common/Logger.js.map +1 -0
- package/lib/module/constants/directories.js +1 -1
- package/lib/module/constants/directories.js.map +1 -1
- package/lib/module/constants/llmDefaults.js +8 -0
- package/lib/module/constants/llmDefaults.js.map +1 -1
- package/lib/module/constants/modelUrls.js +356 -84
- package/lib/module/constants/modelUrls.js.map +1 -1
- package/lib/module/constants/ocr/models.js +181 -286
- package/lib/module/constants/ocr/models.js.map +1 -1
- package/lib/module/constants/ocr/symbols.js +66 -65
- package/lib/module/constants/ocr/symbols.js.map +1 -1
- package/lib/module/controllers/LLMController.js +53 -23
- package/lib/module/controllers/LLMController.js.map +1 -1
- package/lib/module/controllers/OCRController.js +17 -10
- package/lib/module/controllers/OCRController.js.map +1 -1
- package/lib/module/controllers/VerticalOCRController.js +17 -10
- package/lib/module/controllers/VerticalOCRController.js.map +1 -1
- package/lib/module/hooks/computer_vision/useClassification.js +4 -4
- package/lib/module/hooks/computer_vision/useClassification.js.map +1 -1
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js +13 -0
- package/lib/module/hooks/computer_vision/useImageEmbeddings.js.map +1 -0
- package/lib/module/hooks/computer_vision/useImageSegmentation.js +2 -2
- package/lib/module/hooks/computer_vision/useImageSegmentation.js.map +1 -1
- package/lib/module/hooks/computer_vision/useOCR.js +16 -17
- package/lib/module/hooks/computer_vision/useOCR.js.map +1 -1
- package/lib/module/hooks/computer_vision/useObjectDetection.js +3 -3
- package/lib/module/hooks/computer_vision/useObjectDetection.js.map +1 -1
- package/lib/module/hooks/computer_vision/useStyleTransfer.js +3 -3
- package/lib/module/hooks/computer_vision/useStyleTransfer.js.map +1 -1
- package/lib/module/hooks/computer_vision/useTextToImage.js +57 -0
- package/lib/module/hooks/computer_vision/useTextToImage.js.map +1 -0
- package/lib/module/hooks/computer_vision/useVerticalOCR.js +18 -19
- package/lib/module/hooks/computer_vision/useVerticalOCR.js.map +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js +1 -1
- package/lib/module/hooks/general/useExecutorchModule.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useLLM.js +30 -29
- package/lib/module/hooks/natural_language_processing/useLLM.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js +72 -33
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js +2 -3
- package/lib/module/hooks/natural_language_processing/useTextEmbeddings.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useTokenizer.js +19 -18
- package/lib/module/hooks/natural_language_processing/useTokenizer.js.map +1 -1
- package/lib/module/hooks/natural_language_processing/useVAD.js +13 -0
- package/lib/module/hooks/natural_language_processing/useVAD.js.map +1 -0
- package/lib/module/hooks/useModule.js +13 -9
- package/lib/module/hooks/useModule.js.map +1 -1
- package/lib/module/index.js +21 -3
- package/lib/module/index.js.map +1 -1
- package/lib/module/modules/BaseModule.js +9 -14
- package/lib/module/modules/BaseModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ClassificationModule.js +11 -6
- package/lib/module/modules/computer_vision/ClassificationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js +19 -0
- package/lib/module/modules/computer_vision/ImageEmbeddingsModule.js.map +1 -0
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js +20 -18
- package/lib/module/modules/computer_vision/ImageSegmentationModule.js.map +1 -1
- package/lib/module/modules/computer_vision/OCRModule.js +13 -10
- package/lib/module/modules/computer_vision/OCRModule.js.map +1 -1
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js +11 -6
- package/lib/module/modules/computer_vision/ObjectDetectionModule.js.map +1 -1
- package/lib/module/modules/computer_vision/StyleTransferModule.js +11 -6
- package/lib/module/modules/computer_vision/StyleTransferModule.js.map +1 -1
- package/lib/module/modules/computer_vision/TextToImageModule.js +48 -0
- package/lib/module/modules/computer_vision/TextToImageModule.js.map +1 -0
- package/lib/module/modules/computer_vision/VerticalOCRModule.js +15 -10
- package/lib/module/modules/computer_vision/VerticalOCRModule.js.map +1 -1
- package/lib/module/modules/general/ExecutorchModule.js +8 -34
- package/lib/module/modules/general/ExecutorchModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/LLMModule.js +25 -24
- package/lib/module/modules/natural_language_processing/LLMModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +109 -27
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js +13 -6
- package/lib/module/modules/natural_language_processing/TextEmbeddingsModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/TokenizerModule.js +20 -14
- package/lib/module/modules/natural_language_processing/TokenizerModule.js.map +1 -1
- package/lib/module/modules/natural_language_processing/VADModule.js +19 -0
- package/lib/module/modules/natural_language_processing/VADModule.js.map +1 -0
- package/lib/module/native/NativeETInstaller.js +5 -0
- package/lib/module/native/NativeETInstaller.js.map +1 -0
- package/lib/module/native/RnExecutorchModules.js +2 -12
- package/lib/module/native/RnExecutorchModules.js.map +1 -1
- package/lib/module/types/common.js +25 -8
- package/lib/module/types/common.js.map +1 -1
- package/lib/module/types/llm.js.map +1 -1
- package/lib/module/types/stt.js +1 -79
- package/lib/module/types/stt.js.map +1 -1
- package/lib/module/types/vad.js +2 -0
- package/lib/module/types/vad.js.map +1 -0
- package/lib/module/utils/ResourceFetcher.js +275 -114
- package/lib/module/utils/ResourceFetcher.js.map +1 -1
- package/lib/module/utils/ResourceFetcherUtils.js +155 -0
- package/lib/module/utils/ResourceFetcherUtils.js.map +1 -0
- package/lib/module/utils/llm.js +41 -1
- package/lib/module/utils/llm.js.map +1 -1
- package/lib/typescript/Error.d.ts +3 -0
- package/lib/typescript/Error.d.ts.map +1 -1
- package/lib/typescript/common/Logger.d.ts +9 -0
- package/lib/typescript/common/Logger.d.ts.map +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts +1 -0
- package/lib/typescript/constants/llmDefaults.d.ts.map +1 -1
- package/lib/typescript/constants/modelUrls.d.ts +263 -79
- package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/models.d.ts +882 -284
- package/lib/typescript/constants/ocr/models.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts +1 -1
- package/lib/typescript/constants/ocr/symbols.d.ts.map +1 -1
- package/lib/typescript/controllers/LLMController.d.ts +8 -7
- package/lib/typescript/controllers/LLMController.d.ts.map +1 -1
- package/lib/typescript/controllers/OCRController.d.ts +5 -6
- package/lib/typescript/controllers/OCRController.d.ts.map +1 -1
- package/lib/typescript/controllers/VerticalOCRController.d.ts +5 -6
- package/lib/typescript/controllers/VerticalOCRController.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts +8 -6
- package/lib/typescript/hooks/computer_vision/useClassification.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts +16 -0
- package/lib/typescript/hooks/computer_vision/useImageEmbeddings.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useImageSegmentation.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts +5 -5
- package/lib/typescript/hooks/computer_vision/useOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useObjectDetection.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts +5 -3
- package/lib/typescript/hooks/computer_vision/useStyleTransfer.d.ts.map +1 -1
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts +22 -0
- package/lib/typescript/hooks/computer_vision/useTextToImage.d.ts.map +1 -0
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts +4 -6
- package/lib/typescript/hooks/computer_vision/useVerticalOCR.d.ts.map +1 -1
- package/lib/typescript/hooks/general/useExecutorchModule.d.ts +1 -1
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useLLM.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -22
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts +9 -5
- package/lib/typescript/hooks/natural_language_processing/useTextEmbeddings.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts +6 -4
- package/lib/typescript/hooks/natural_language_processing/useTokenizer.d.ts.map +1 -1
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts +16 -0
- package/lib/typescript/hooks/natural_language_processing/useVAD.d.ts.map +1 -0
- package/lib/typescript/hooks/useModule.d.ts +8 -5
- package/lib/typescript/hooks/useModule.d.ts.map +1 -1
- package/lib/typescript/index.d.ts +26 -3
- package/lib/typescript/index.d.ts.map +1 -1
- package/lib/typescript/modules/BaseModule.d.ts +7 -6
- package/lib/typescript/modules/BaseModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts +4 -4
- package/lib/typescript/modules/computer_vision/ClassificationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts +9 -0
- package/lib/typescript/modules/computer_vision/ImageEmbeddingsModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts +7 -27
- package/lib/typescript/modules/computer_vision/ImageSegmentationModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts +8 -7
- package/lib/typescript/modules/computer_vision/OCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts +5 -3
- package/lib/typescript/modules/computer_vision/ObjectDetectionModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts +4 -3
- package/lib/typescript/modules/computer_vision/StyleTransferModule.d.ts.map +1 -1
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts +16 -0
- package/lib/typescript/modules/computer_vision/TextToImageModule.d.ts.map +1 -0
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts +7 -8
- package/lib/typescript/modules/computer_vision/VerticalOCRModule.d.ts.map +1 -1
- package/lib/typescript/modules/general/ExecutorchModule.d.ts +4 -7
- package/lib/typescript/modules/general/ExecutorchModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts +19 -17
- package/lib/typescript/modules/natural_language_processing/LLMModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +17 -13
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts +5 -3
- package/lib/typescript/modules/natural_language_processing/TextEmbeddingsModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts +10 -9
- package/lib/typescript/modules/natural_language_processing/TokenizerModule.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts +10 -0
- package/lib/typescript/modules/natural_language_processing/VADModule.d.ts.map +1 -0
- package/lib/typescript/native/{NativeStyleTransfer.d.ts → NativeETInstaller.d.ts} +2 -3
- package/lib/typescript/native/NativeETInstaller.d.ts.map +1 -0
- package/lib/typescript/native/RnExecutorchModules.d.ts +3 -23
- package/lib/typescript/native/RnExecutorchModules.d.ts.map +1 -1
- package/lib/typescript/types/common.d.ts +30 -2
- package/lib/typescript/types/common.d.ts.map +1 -1
- package/lib/typescript/types/llm.d.ts +9 -1
- package/lib/typescript/types/llm.d.ts.map +1 -1
- package/lib/typescript/types/stt.d.ts +9 -88
- package/lib/typescript/types/stt.d.ts.map +1 -1
- package/lib/typescript/types/vad.d.ts +5 -0
- package/lib/typescript/types/vad.d.ts.map +1 -0
- package/lib/typescript/utils/ResourceFetcher.d.ts +47 -10
- package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts +55 -0
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -0
- package/lib/typescript/utils/llm.d.ts +4 -0
- package/lib/typescript/utils/llm.d.ts.map +1 -1
- package/package.json +32 -68
- package/react-native-executorch.podspec +62 -4
- package/src/Error.ts +3 -0
- package/src/common/Logger.ts +25 -0
- package/src/constants/directories.ts +1 -1
- package/src/constants/llmDefaults.ts +11 -0
- package/src/constants/modelUrls.ts +433 -168
- package/src/constants/ocr/models.ts +826 -395
- package/src/constants/ocr/symbols.ts +66 -65
- package/src/controllers/LLMController.ts +76 -36
- package/src/controllers/OCRController.ts +25 -16
- package/src/controllers/VerticalOCRController.ts +25 -15
- package/src/hooks/computer_vision/useClassification.ts +8 -9
- package/src/hooks/computer_vision/useImageEmbeddings.ts +15 -0
- package/src/hooks/computer_vision/useImageSegmentation.ts +3 -6
- package/src/hooks/computer_vision/useOCR.ts +32 -25
- package/src/hooks/computer_vision/useObjectDetection.ts +4 -7
- package/src/hooks/computer_vision/useStyleTransfer.ts +4 -4
- package/src/hooks/computer_vision/useTextToImage.ts +92 -0
- package/src/hooks/computer_vision/useVerticalOCR.ts +33 -31
- package/src/hooks/general/useExecutorchModule.ts +1 -1
- package/src/hooks/natural_language_processing/useLLM.ts +54 -31
- package/src/hooks/natural_language_processing/useSpeechToText.ts +96 -88
- package/src/hooks/natural_language_processing/useTextEmbeddings.ts +9 -9
- package/src/hooks/natural_language_processing/useTokenizer.ts +21 -21
- package/src/hooks/natural_language_processing/useVAD.ts +15 -0
- package/src/hooks/useModule.ts +23 -13
- package/src/index.ts +126 -0
- package/src/modules/BaseModule.ts +17 -22
- package/src/modules/computer_vision/ClassificationModule.ts +18 -9
- package/src/modules/computer_vision/ImageEmbeddingsModule.ts +26 -0
- package/src/modules/computer_vision/ImageSegmentationModule.ts +34 -26
- package/src/modules/computer_vision/OCRModule.ts +23 -15
- package/src/modules/computer_vision/ObjectDetectionModule.ts +22 -9
- package/src/modules/computer_vision/StyleTransferModule.ts +18 -9
- package/src/modules/computer_vision/TextToImageModule.ts +93 -0
- package/src/modules/computer_vision/VerticalOCRModule.ts +25 -21
- package/src/modules/general/ExecutorchModule.ts +16 -46
- package/src/modules/natural_language_processing/LLMModule.ts +41 -32
- package/src/modules/natural_language_processing/SpeechToTextModule.ts +164 -66
- package/src/modules/natural_language_processing/TextEmbeddingsModule.ts +25 -10
- package/src/modules/natural_language_processing/TokenizerModule.ts +27 -17
- package/src/modules/natural_language_processing/VADModule.ts +27 -0
- package/src/native/NativeETInstaller.ts +8 -0
- package/src/native/RnExecutorchModules.ts +4 -50
- package/src/types/common.ts +40 -12
- package/src/types/llm.ts +10 -0
- package/src/types/stt.ts +87 -90
- package/src/types/vad.ts +4 -0
- package/src/utils/ResourceFetcher.ts +342 -120
- package/src/utils/ResourceFetcherUtils.ts +184 -0
- package/src/utils/llm.ts +65 -1
- package/third-party/android/libs/cpuinfo/arm64-v8a/libcpuinfo.so +0 -0
- package/third-party/android/libs/executorch/arm64-v8a/libexecutorch.so +0 -0
- package/third-party/android/libs/executorch/x86_64/libexecutorch.so +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/arm64-v8a/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_core.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_features2d.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_highgui.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_imgproc.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_photo.a +0 -0
- package/third-party/android/libs/opencv/x86_64/libopencv_video.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_hal.a +0 -0
- package/third-party/android/libs/opencv-third-party/arm64-v8a/libkleidicv_thread.a +0 -0
- package/third-party/android/libs/pthreadpool/arm64-v8a/libpthreadpool.so +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libsentencepiece.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/arm64-v8a/libtokenizers_cpp.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib → third-party/android/libs/tokenizers-cpp/x86_64/libsentencepiece.a} +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_c.a +0 -0
- package/third-party/android/libs/tokenizers-cpp/x86_64/libtokenizers_cpp.a +0 -0
- package/third-party/include/c10/macros/Export.h +1 -0
- package/third-party/include/c10/macros/Macros.h +1 -0
- package/third-party/include/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/c10/util/BFloat16.h +1 -0
- package/third-party/include/c10/util/Half-inl.h +1 -0
- package/third-party/include/c10/util/Half.h +8 -0
- package/third-party/include/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/c10/util/bit_cast.h +1 -0
- package/third-party/include/c10/util/complex.h +72 -0
- package/third-party/include/c10/util/complex_math.h +399 -0
- package/third-party/include/c10/util/complex_utils.h +41 -0
- package/third-party/include/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/c10/util/irange.h +107 -0
- package/third-party/include/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/c10/util/overflows.h +95 -0
- package/third-party/include/c10/util/safe_numerics.h +97 -0
- package/third-party/include/cpuinfo/cpuinfo.h +2305 -0
- package/third-party/include/executorch/ExecuTorch.h +13 -0
- package/third-party/include/executorch/ExecuTorchError.h +90 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLM.h +12 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMConfig.h +56 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMError.h +16 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMMultimodalRunner.h +227 -0
- package/third-party/include/executorch/ExecuTorchLLM/ExecuTorchLLMTextRunner.h +97 -0
- package/third-party/include/executorch/ExecuTorchLLM/module.modulemap +4 -0
- package/third-party/include/executorch/ExecuTorchLog.h +77 -0
- package/third-party/include/executorch/ExecuTorchModule.h +563 -0
- package/third-party/include/executorch/ExecuTorchTensor.h +1421 -0
- package/third-party/include/executorch/ExecuTorchValue.h +265 -0
- package/third-party/include/executorch/extension/module/bundled_module.h +131 -0
- package/third-party/include/executorch/extension/module/module.h +649 -0
- package/third-party/include/executorch/extension/tensor/tensor.h +14 -0
- package/third-party/include/executorch/extension/tensor/tensor_accessor.h +190 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr.h +409 -0
- package/third-party/include/executorch/extension/tensor/tensor_ptr_maker.h +653 -0
- package/third-party/include/executorch/extension/threadpool/cpuinfo_utils.h +24 -0
- package/third-party/include/executorch/extension/threadpool/threadpool.h +95 -0
- package/third-party/include/executorch/runtime/backend/backend_execution_context.h +71 -0
- package/third-party/include/executorch/runtime/backend/backend_init_context.h +84 -0
- package/third-party/include/executorch/runtime/backend/backend_option_context.h +34 -0
- package/third-party/include/executorch/runtime/backend/interface.h +227 -0
- package/third-party/include/executorch/runtime/backend/options.h +206 -0
- package/third-party/include/executorch/runtime/core/array_ref.h +235 -0
- package/third-party/include/executorch/runtime/core/data_loader.h +136 -0
- package/third-party/include/executorch/runtime/core/defines.h +20 -0
- package/third-party/include/executorch/runtime/core/error.h +256 -0
- package/third-party/include/executorch/runtime/core/evalue.h +515 -0
- package/third-party/include/executorch/runtime/core/event_tracer.h +580 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks.h +332 -0
- package/third-party/include/executorch/runtime/core/event_tracer_hooks_delegate.h +197 -0
- package/third-party/include/executorch/runtime/core/exec_aten/exec_aten.h +170 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/dim_order_util.h +264 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/scalar_type_util.h +1313 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_dimension_limit.h +21 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_shape_to_c_string.h +69 -0
- package/third-party/include/executorch/runtime/core/exec_aten/util/tensor_util.h +1251 -0
- package/third-party/include/executorch/runtime/core/freeable_buffer.h +107 -0
- package/third-party/include/executorch/runtime/core/function_ref.h +100 -0
- package/third-party/include/executorch/runtime/core/hierarchical_allocator.h +107 -0
- package/third-party/include/executorch/runtime/core/memory_allocator.h +208 -0
- package/third-party/include/executorch/runtime/core/named_data_map.h +76 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/bfloat16_math.h +14 -0
- package/third-party/include/executorch/runtime/core/portable_type/bits_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Export.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/macros/Macros.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16-math.h +266 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/BFloat16.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half-inl.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/Half.h +8 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/TypeSafeSignMath.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/bit_cast.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex.h +72 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_math.h +399 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/complex_utils.h +41 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/floating_point_utils.h +1 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/irange.h +107 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/llvmMathExtras.h +866 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/overflows.h +95 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/c10/util/safe_numerics.h +97 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/executorch/runtime/core/portable_type/c10/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/include/executorch/runtime/core/portable_type/complex.h +21 -0
- package/third-party/include/executorch/runtime/core/portable_type/device.h +70 -0
- package/third-party/include/executorch/runtime/core/portable_type/half.h +27 -0
- package/third-party/include/executorch/runtime/core/portable_type/optional.h +36 -0
- package/third-party/include/executorch/runtime/core/portable_type/qint_types.h +83 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar.h +110 -0
- package/third-party/include/executorch/runtime/core/portable_type/scalar_type.h +154 -0
- package/third-party/include/executorch/runtime/core/portable_type/string_view.h +29 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor.h +142 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_impl.h +281 -0
- package/third-party/include/executorch/runtime/core/portable_type/tensor_options.h +60 -0
- package/third-party/include/executorch/runtime/core/result.h +258 -0
- package/third-party/include/executorch/runtime/core/span.h +97 -0
- package/third-party/include/executorch/runtime/core/tag.h +90 -0
- package/third-party/include/executorch/runtime/core/tensor_layout.h +79 -0
- package/third-party/include/executorch/runtime/core/tensor_shape_dynamism.h +39 -0
- package/third-party/include/executorch/runtime/executor/memory_manager.h +113 -0
- package/third-party/include/executorch/runtime/executor/merged_data_map.h +142 -0
- package/third-party/include/executorch/runtime/executor/method.h +412 -0
- package/third-party/include/executorch/runtime/executor/method_meta.h +298 -0
- package/third-party/include/executorch/runtime/executor/program.h +309 -0
- package/third-party/include/executorch/runtime/executor/pte_data_map.h +145 -0
- package/third-party/include/executorch/runtime/executor/tensor_parser.h +157 -0
- package/third-party/include/executorch/runtime/kernel/kernel_runtime_context.h +122 -0
- package/third-party/include/executorch/runtime/kernel/operator_registry.h +280 -0
- package/third-party/include/executorch/runtime/platform/abort.h +36 -0
- package/third-party/include/executorch/runtime/platform/assert.h +119 -0
- package/third-party/include/executorch/runtime/platform/clock.h +43 -0
- package/third-party/include/executorch/runtime/platform/compat_unistd.h +75 -0
- package/third-party/include/executorch/runtime/platform/compiler.h +201 -0
- package/third-party/include/executorch/runtime/platform/log.h +177 -0
- package/third-party/include/executorch/runtime/platform/platform.h +259 -0
- package/third-party/include/executorch/runtime/platform/profiler.h +292 -0
- package/third-party/include/executorch/runtime/platform/runtime.h +35 -0
- package/third-party/include/executorch/runtime/platform/system.h +49 -0
- package/third-party/include/executorch/runtime/platform/types.h +24 -0
- package/third-party/include/executorch/schema/extended_header.h +85 -0
- package/third-party/include/headeronly/macros/Export.h +88 -0
- package/third-party/include/opencv2/core/affine.hpp +676 -0
- package/third-party/include/opencv2/core/async.hpp +107 -0
- package/third-party/include/opencv2/core/base.hpp +735 -0
- package/third-party/include/opencv2/core/bindings_utils.hpp +279 -0
- package/third-party/include/opencv2/core/bufferpool.hpp +39 -0
- package/third-party/include/opencv2/core/check.hpp +231 -0
- package/third-party/include/opencv2/core/core.hpp +55 -0
- package/third-party/include/opencv2/core/core_c.h +3261 -0
- package/third-party/include/opencv2/core/cv_cpu_dispatch.h +404 -0
- package/third-party/include/opencv2/core/cv_cpu_helper.h +856 -0
- package/third-party/include/opencv2/core/cvdef.h +1003 -0
- package/third-party/include/opencv2/core/cvstd.hpp +196 -0
- package/third-party/include/opencv2/core/cvstd.inl.hpp +188 -0
- package/third-party/include/opencv2/core/cvstd_wrapper.hpp +187 -0
- package/third-party/include/opencv2/core/detail/async_promise.hpp +73 -0
- package/third-party/include/opencv2/core/detail/dispatch_helper.impl.hpp +48 -0
- package/third-party/include/opencv2/core/detail/exception_ptr.hpp +24 -0
- package/third-party/include/opencv2/core/dualquaternion.hpp +1054 -0
- package/third-party/include/opencv2/core/dualquaternion.inl.hpp +464 -0
- package/third-party/include/opencv2/core/eigen.hpp +405 -0
- package/third-party/include/opencv2/core/fast_math.hpp +433 -0
- package/third-party/include/opencv2/core/hal/hal.hpp +451 -0
- package/third-party/include/opencv2/core/hal/interface.h +191 -0
- package/third-party/include/opencv2/core/hal/intrin.hpp +1222 -0
- package/third-party/include/opencv2/core/hal/intrin_avx.hpp +3378 -0
- package/third-party/include/opencv2/core/hal/intrin_avx512.hpp +3688 -0
- package/third-party/include/opencv2/core/hal/intrin_cpp.hpp +3446 -0
- package/third-party/include/opencv2/core/hal/intrin_forward.hpp +195 -0
- package/third-party/include/opencv2/core/hal/intrin_lasx.hpp +3243 -0
- package/third-party/include/opencv2/core/hal/intrin_lsx.hpp +2671 -0
- package/third-party/include/opencv2/core/hal/intrin_math.hpp +772 -0
- package/third-party/include/opencv2/core/hal/intrin_msa.hpp +1973 -0
- package/third-party/include/opencv2/core/hal/intrin_neon.hpp +2710 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv071.hpp +3452 -0
- package/third-party/include/opencv2/core/hal/intrin_rvv_scalable.hpp +2559 -0
- package/third-party/include/opencv2/core/hal/intrin_sse.hpp +3528 -0
- package/third-party/include/opencv2/core/hal/intrin_sse_em.hpp +175 -0
- package/third-party/include/opencv2/core/hal/intrin_vsx.hpp +1756 -0
- package/third-party/include/opencv2/core/hal/intrin_wasm.hpp +2911 -0
- package/third-party/include/opencv2/core/hal/msa_macros.h +2079 -0
- package/third-party/include/opencv2/core/hal/simd_utils.impl.hpp +313 -0
- package/third-party/include/opencv2/core/mat.hpp +3842 -0
- package/third-party/include/opencv2/core/mat.inl.hpp +2753 -0
- package/third-party/include/opencv2/core/matx.hpp +603 -0
- package/third-party/include/opencv2/core/matx.inl.hpp +1132 -0
- package/third-party/include/opencv2/core/neon_utils.hpp +127 -0
- package/third-party/include/opencv2/core/operations.hpp +610 -0
- package/third-party/include/opencv2/core/optim.hpp +362 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.openmp.hpp +66 -0
- package/third-party/include/opencv2/core/parallel/backend/parallel_for.tbb.hpp +148 -0
- package/third-party/include/opencv2/core/parallel/parallel_backend.hpp +108 -0
- package/third-party/include/opencv2/core/persistence.hpp +1321 -0
- package/third-party/include/opencv2/core/quaternion.hpp +1889 -0
- package/third-party/include/opencv2/core/quaternion.inl.hpp +907 -0
- package/third-party/include/opencv2/core/saturate.hpp +347 -0
- package/third-party/include/opencv2/core/simd_intrinsics.hpp +90 -0
- package/third-party/include/opencv2/core/softfloat.hpp +657 -0
- package/third-party/include/opencv2/core/sse_utils.hpp +861 -0
- package/third-party/include/opencv2/core/traits.hpp +417 -0
- package/third-party/include/opencv2/core/types.hpp +2368 -0
- package/third-party/include/opencv2/core/types_c.h +2064 -0
- package/third-party/include/opencv2/core/utility.hpp +1296 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.hpp +31 -0
- package/third-party/include/opencv2/core/utils/allocator_stats.impl.hpp +111 -0
- package/third-party/include/opencv2/core/utils/filesystem.hpp +91 -0
- package/third-party/include/opencv2/core/utils/fp_control_utils.hpp +70 -0
- package/third-party/include/opencv2/core/utils/instrumentation.hpp +127 -0
- package/third-party/include/opencv2/core/utils/logger.defines.hpp +50 -0
- package/third-party/include/opencv2/core/utils/logger.hpp +258 -0
- package/third-party/include/opencv2/core/utils/logtag.hpp +27 -0
- package/third-party/include/opencv2/core/utils/tls.hpp +230 -0
- package/third-party/include/opencv2/core/utils/trace.hpp +281 -0
- package/third-party/include/opencv2/core/version.hpp +29 -0
- package/third-party/include/opencv2/core/vsx_utils.hpp +1115 -0
- package/third-party/include/opencv2/core.hpp +3699 -0
- package/third-party/include/opencv2/cvconfig.h +155 -0
- package/third-party/include/opencv2/dnn/dnn.hpp +51 -0
- package/third-party/include/opencv2/dnn.hpp +17 -0
- package/third-party/include/opencv2/features2d/features2d.hpp +55 -0
- package/third-party/include/opencv2/features2d/hal/interface.h +32 -0
- package/third-party/include/opencv2/features2d.hpp +1756 -0
- package/third-party/include/opencv2/highgui/highgui.hpp +113 -0
- package/third-party/include/opencv2/highgui.hpp +17 -0
- package/third-party/include/opencv2/imgproc/bindings.hpp +34 -0
- package/third-party/include/opencv2/imgproc/detail/gcgraph.hpp +355 -0
- package/third-party/include/opencv2/imgproc/detail/legacy.hpp +35 -0
- package/third-party/include/opencv2/imgproc/hal/hal.hpp +246 -0
- package/third-party/include/opencv2/imgproc/hal/interface.h +52 -0
- package/third-party/include/opencv2/imgproc/imgproc.hpp +55 -0
- package/third-party/include/opencv2/imgproc/imgproc_c.h +1261 -0
- package/third-party/include/opencv2/imgproc/segmentation.hpp +168 -0
- package/third-party/include/opencv2/imgproc/types_c.h +632 -0
- package/third-party/include/opencv2/imgproc.hpp +5956 -0
- package/third-party/include/opencv2/opencv.hpp +102 -0
- package/third-party/include/opencv2/opencv_modules.hpp +19 -0
- package/third-party/include/opencv2/photo/legacy/constants_c.h +10 -0
- package/third-party/include/opencv2/photo/photo.hpp +55 -0
- package/third-party/include/opencv2/photo.hpp +975 -0
- package/third-party/include/opencv2/video/background_segm.hpp +341 -0
- package/third-party/include/opencv2/video/detail/tracking.detail.hpp +435 -0
- package/third-party/include/opencv2/video/legacy/constants_c.h +15 -0
- package/third-party/include/opencv2/video/tracking.hpp +1014 -0
- package/third-party/include/opencv2/video/video.hpp +55 -0
- package/third-party/include/opencv2/video.hpp +65 -0
- package/third-party/include/pthreadpool/pthreadpool.h +2236 -0
- package/third-party/include/tokenizers-cpp/tokenizers_c.h +61 -0
- package/third-party/include/tokenizers-cpp/tokenizers_cpp.h +118 -0
- package/third-party/include/torch/headeronly/macros/Export.h +154 -0
- package/third-party/include/torch/headeronly/macros/Macros.h +553 -0
- package/third-party/include/torch/headeronly/util/BFloat16.h +477 -0
- package/third-party/include/torch/headeronly/util/Half.h +781 -0
- package/third-party/include/torch/headeronly/util/TypeSafeSignMath.h +141 -0
- package/third-party/include/torch/headeronly/util/bit_cast.h +49 -0
- package/third-party/include/torch/headeronly/util/complex.h +593 -0
- package/third-party/include/torch/headeronly/util/floating_point_utils.h +38 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/ExecutorchLib +0 -0
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Info.plist +0 -0
- package/third-party/ios/libs/cpuinfo/libcpuinfo.a +0 -0
- package/third-party/ios/libs/pthreadpool/physical-arm64-release/libpthreadpool.a +0 -0
- package/third-party/ios/libs/pthreadpool/simulator-arm64-debug/libpthreadpool.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libsentencepiece.a +0 -0
- package/{ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/ExecutorchLib → third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_c.a} +0 -0
- package/third-party/ios/libs/tokenizers-cpp/physical-arm64-release/libtokenizers_cpp.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libsentencepiece.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_c.a +0 -0
- package/third-party/ios/libs/tokenizers-cpp/simulator-arm64-debug/libtokenizers_cpp.a +0 -0
- package/LICENSE +0 -79
- package/android/src/main/java/com/swmansion/rnexecutorch/Classification.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/ETModule.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ImageSegmentation.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/LLM.kt +0 -63
- package/android/src/main/java/com/swmansion/rnexecutorch/OCR.kt +0 -90
- package/android/src/main/java/com/swmansion/rnexecutorch/ObjectDetection.kt +0 -64
- package/android/src/main/java/com/swmansion/rnexecutorch/SpeechToText.kt +0 -91
- package/android/src/main/java/com/swmansion/rnexecutorch/StyleTransfer.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/TextEmbeddings.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/Tokenizer.kt +0 -86
- package/android/src/main/java/com/swmansion/rnexecutorch/VerticalOCR.kt +0 -179
- package/android/src/main/java/com/swmansion/rnexecutorch/models/BaseModel.kt +0 -54
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsModel.kt +0 -48
- package/android/src/main/java/com/swmansion/rnexecutorch/models/TextEmbeddings/TextEmbeddingsUtils.kt +0 -37
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/ClassificationModel.kt +0 -46
- package/android/src/main/java/com/swmansion/rnexecutorch/models/classification/Constants.kt +0 -1005
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/Constants.kt +0 -26
- package/android/src/main/java/com/swmansion/rnexecutorch/models/imageSegmentation/ImageSegmentationModel.kt +0 -142
- package/android/src/main/java/com/swmansion/rnexecutorch/models/objectDetection/SSDLiteLargeModel.kt +0 -74
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Detector.kt +0 -82
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/RecognitionHandler.kt +0 -117
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/Recognizer.kt +0 -51
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/VerticalDetector.kt +0 -89
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/CTCLabelConverter.kt +0 -58
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/Constants.kt +0 -31
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/DetectorUtils.kt +0 -608
- package/android/src/main/java/com/swmansion/rnexecutorch/models/ocr/utils/RecognizerUtils.kt +0 -430
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TDecoder.kt +0 -39
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/BaseS2TModule.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Moonshine.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineDecoder.kt +0 -23
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/MoonshineEncoder.kt +0 -20
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/Whisper.kt +0 -16
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperDecoder.kt +0 -22
- package/android/src/main/java/com/swmansion/rnexecutorch/models/speechToText/WhisperEncoder.kt +0 -29
- package/android/src/main/java/com/swmansion/rnexecutorch/models/styleTransfer/StyleTransferModel.kt +0 -43
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ArrayUtils.kt +0 -87
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ETError.kt +0 -34
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ImageProcessor.kt +0 -237
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/Numerical.kt +0 -8
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/ObjectDetectionUtils.kt +0 -201
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/STFT.kt +0 -50
- package/android/src/main/java/com/swmansion/rnexecutorch/utils/TensorUtils.kt +0 -103
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/ETModel.h +0 -27
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/HuggingFaceTokenizer.h +0 -14
- package/ios/ExecutorchLib.xcframework/ios-arm64-simulator/ExecutorchLib.framework/Headers/LLaMARunner.h +0 -32
- package/ios/RnExecutorch/Classification.h +0 -5
- package/ios/RnExecutorch/Classification.mm +0 -54
- package/ios/RnExecutorch/ETModule.h +0 -5
- package/ios/RnExecutorch/ETModule.mm +0 -75
- package/ios/RnExecutorch/ImageSegmentation.h +0 -5
- package/ios/RnExecutorch/ImageSegmentation.mm +0 -60
- package/ios/RnExecutorch/LLM.h +0 -5
- package/ios/RnExecutorch/LLM.mm +0 -78
- package/ios/RnExecutorch/OCR.h +0 -5
- package/ios/RnExecutorch/OCR.mm +0 -96
- package/ios/RnExecutorch/ObjectDetection.h +0 -5
- package/ios/RnExecutorch/ObjectDetection.mm +0 -56
- package/ios/RnExecutorch/SpeechToText.h +0 -5
- package/ios/RnExecutorch/SpeechToText.mm +0 -125
- package/ios/RnExecutorch/StyleTransfer.h +0 -5
- package/ios/RnExecutorch/StyleTransfer.mm +0 -55
- package/ios/RnExecutorch/TextEmbeddings.h +0 -5
- package/ios/RnExecutorch/TextEmbeddings.mm +0 -62
- package/ios/RnExecutorch/Tokenizer.h +0 -5
- package/ios/RnExecutorch/Tokenizer.mm +0 -83
- package/ios/RnExecutorch/VerticalOCR.h +0 -5
- package/ios/RnExecutorch/VerticalOCR.mm +0 -183
- package/ios/RnExecutorch/models/BaseModel.h +0 -21
- package/ios/RnExecutorch/models/BaseModel.mm +0 -43
- package/ios/RnExecutorch/models/classification/ClassificationModel.h +0 -10
- package/ios/RnExecutorch/models/classification/ClassificationModel.mm +0 -53
- package/ios/RnExecutorch/models/classification/Constants.h +0 -3
- package/ios/RnExecutorch/models/image_segmentation/Constants.h +0 -4
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.h +0 -10
- package/ios/RnExecutorch/models/image_segmentation/ImageSegmentationModel.mm +0 -146
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.hpp +0 -11
- package/ios/RnExecutorch/models/object_detection/SSDLiteLargeModel.mm +0 -64
- package/ios/RnExecutorch/models/ocr/Detector.h +0 -9
- package/ios/RnExecutorch/models/ocr/Detector.mm +0 -101
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.h +0 -16
- package/ios/RnExecutorch/models/ocr/RecognitionHandler.mm +0 -135
- package/ios/RnExecutorch/models/ocr/Recognizer.h +0 -8
- package/ios/RnExecutorch/models/ocr/Recognizer.mm +0 -77
- package/ios/RnExecutorch/models/ocr/VerticalDetector.h +0 -10
- package/ios/RnExecutorch/models/ocr/VerticalDetector.mm +0 -118
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.h +0 -16
- package/ios/RnExecutorch/models/ocr/utils/CTCLabelConverter.mm +0 -80
- package/ios/RnExecutorch/models/ocr/utils/Constants.h +0 -26
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.h +0 -31
- package/ios/RnExecutorch/models/ocr/utils/DetectorUtils.mm +0 -754
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.h +0 -10
- package/ios/RnExecutorch/models/ocr/utils/OCRUtils.mm +0 -67
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.h +0 -35
- package/ios/RnExecutorch/models/ocr/utils/RecognizerUtils.mm +0 -331
- package/ios/RnExecutorch/models/stt/Moonshine.hpp +0 -13
- package/ios/RnExecutorch/models/stt/Moonshine.mm +0 -64
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/MoonshineDecoder.mm +0 -24
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/MoonshineEncoder.mm +0 -18
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.hpp +0 -26
- package/ios/RnExecutorch/models/stt/SpeechToTextBaseModel.mm +0 -19
- package/ios/RnExecutorch/models/stt/Whisper.hpp +0 -12
- package/ios/RnExecutorch/models/stt/Whisper.mm +0 -68
- package/ios/RnExecutorch/models/stt/WhisperDecoder.hpp +0 -16
- package/ios/RnExecutorch/models/stt/WhisperDecoder.mm +0 -22
- package/ios/RnExecutorch/models/stt/WhisperEncoder.hpp +0 -15
- package/ios/RnExecutorch/models/stt/WhisperEncoder.mm +0 -21
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.h +0 -11
- package/ios/RnExecutorch/models/style_transfer/StyleTransferModel.mm +0 -50
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.h +0 -15
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsModel.mm +0 -45
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.h +0 -8
- package/ios/RnExecutorch/models/text_embeddings/TextEmbeddingsUtils.mm +0 -49
- package/ios/RnExecutorch/utils/Constants.h +0 -8
- package/ios/RnExecutorch/utils/Conversions.h +0 -15
- package/ios/RnExecutorch/utils/ETError.h +0 -26
- package/ios/RnExecutorch/utils/ImageProcessor.h +0 -15
- package/ios/RnExecutorch/utils/ImageProcessor.mm +0 -147
- package/ios/RnExecutorch/utils/Numerical.h +0 -1
- package/ios/RnExecutorch/utils/Numerical.mm +0 -18
- package/ios/RnExecutorch/utils/ObjectDetectionUtils.hpp +0 -23
- package/ios/RnExecutorch/utils/SFFT.hpp +0 -13
- package/ios/RnExecutorch/utils/SFFT.mm +0 -71
- package/ios/RnExecutorch/utils/ScalarType.h +0 -14
- package/ios/RnExecutorch/utils/ScalarType.mm +0 -21
- package/lib/module/constants/sttDefaults.js +0 -72
- package/lib/module/constants/sttDefaults.js.map +0 -1
- package/lib/module/controllers/SpeechToTextController.js +0 -307
- package/lib/module/controllers/SpeechToTextController.js.map +0 -1
- package/lib/module/native/NativeClassification.js +0 -5
- package/lib/module/native/NativeClassification.js.map +0 -1
- package/lib/module/native/NativeETModule.js +0 -5
- package/lib/module/native/NativeETModule.js.map +0 -1
- package/lib/module/native/NativeImageSegmentation.js +0 -5
- package/lib/module/native/NativeImageSegmentation.js.map +0 -1
- package/lib/module/native/NativeLLM.js +0 -5
- package/lib/module/native/NativeLLM.js.map +0 -1
- package/lib/module/native/NativeOCR.js +0 -5
- package/lib/module/native/NativeOCR.js.map +0 -1
- package/lib/module/native/NativeObjectDetection.js +0 -5
- package/lib/module/native/NativeObjectDetection.js.map +0 -1
- package/lib/module/native/NativeSpeechToText.js +0 -5
- package/lib/module/native/NativeSpeechToText.js.map +0 -1
- package/lib/module/native/NativeStyleTransfer.js +0 -5
- package/lib/module/native/NativeStyleTransfer.js.map +0 -1
- package/lib/module/native/NativeTextEmbeddings.js +0 -5
- package/lib/module/native/NativeTextEmbeddings.js.map +0 -1
- package/lib/module/native/NativeTokenizer.js +0 -5
- package/lib/module/native/NativeTokenizer.js.map +0 -1
- package/lib/module/native/NativeVerticalOCR.js +0 -5
- package/lib/module/native/NativeVerticalOCR.js.map +0 -1
- package/lib/module/package.json +0 -1
- package/lib/module/utils/stt.js +0 -22
- package/lib/module/utils/stt.js.map +0 -1
- package/lib/typescript/constants/sttDefaults.d.ts +0 -28
- package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
- package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -52
- package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
- package/lib/typescript/native/NativeClassification.d.ts +0 -10
- package/lib/typescript/native/NativeClassification.d.ts.map +0 -1
- package/lib/typescript/native/NativeETModule.d.ts +0 -9
- package/lib/typescript/native/NativeETModule.d.ts.map +0 -1
- package/lib/typescript/native/NativeImageSegmentation.d.ts +0 -10
- package/lib/typescript/native/NativeImageSegmentation.d.ts.map +0 -1
- package/lib/typescript/native/NativeLLM.d.ts +0 -12
- package/lib/typescript/native/NativeLLM.d.ts.map +0 -1
- package/lib/typescript/native/NativeOCR.d.ts +0 -9
- package/lib/typescript/native/NativeOCR.d.ts.map +0 -1
- package/lib/typescript/native/NativeObjectDetection.d.ts +0 -9
- package/lib/typescript/native/NativeObjectDetection.d.ts.map +0 -1
- package/lib/typescript/native/NativeSpeechToText.d.ts +0 -12
- package/lib/typescript/native/NativeSpeechToText.d.ts.map +0 -1
- package/lib/typescript/native/NativeStyleTransfer.d.ts.map +0 -1
- package/lib/typescript/native/NativeTextEmbeddings.d.ts +0 -8
- package/lib/typescript/native/NativeTextEmbeddings.d.ts.map +0 -1
- package/lib/typescript/native/NativeTokenizer.d.ts +0 -12
- package/lib/typescript/native/NativeTokenizer.d.ts.map +0 -1
- package/lib/typescript/native/NativeVerticalOCR.d.ts +0 -9
- package/lib/typescript/native/NativeVerticalOCR.d.ts.map +0 -1
- package/lib/typescript/utils/stt.d.ts +0 -2
- package/lib/typescript/utils/stt.d.ts.map +0 -1
- package/src/constants/sttDefaults.ts +0 -86
- package/src/controllers/SpeechToTextController.ts +0 -458
- package/src/index.tsx +0 -47
- package/src/native/NativeClassification.ts +0 -9
- package/src/native/NativeETModule.ts +0 -14
- package/src/native/NativeImageSegmentation.ts +0 -14
- package/src/native/NativeLLM.ts +0 -14
- package/src/native/NativeOCR.ts +0 -16
- package/src/native/NativeObjectDetection.ts +0 -10
- package/src/native/NativeSpeechToText.ts +0 -17
- package/src/native/NativeStyleTransfer.ts +0 -10
- package/src/native/NativeTextEmbeddings.ts +0 -9
- package/src/native/NativeTokenizer.ts +0 -13
- package/src/native/NativeVerticalOCR.ts +0 -16
- package/src/utils/stt.ts +0 -28
- package/{ios → third-party/ios}/ExecutorchLib.xcframework/Info.plist +4 -4
|
@@ -0,0 +1,369 @@
|
|
|
1
|
+
/*
|
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
3
|
+
* All rights reserved.
|
|
4
|
+
*
|
|
5
|
+
* This source code is licensed under the BSD-style license found in the
|
|
6
|
+
* LICENSE file in the root directory of this source tree.
|
|
7
|
+
* @lint-ignore-every CLANGTIDY facebook-hte-Deprecated
|
|
8
|
+
*/
|
|
9
|
+
|
|
10
|
+
// A simple llama2 runner that includes preprocessing and post processing logic.
|
|
11
|
+
// The module takes in a string as input and emits a string as output.
|
|
12
|
+
|
|
13
|
+
#include "runner.h"
|
|
14
|
+
#include "util.h"
|
|
15
|
+
#include <ctime>
|
|
16
|
+
#include <fstream>
|
|
17
|
+
#include <iostream>
|
|
18
|
+
|
|
19
|
+
namespace example {
|
|
20
|
+
|
|
21
|
+
using ::executorch::extension::Module;
|
|
22
|
+
using ::executorch::runtime::Error;
|
|
23
|
+
using ::executorch::runtime::Result;
|
|
24
|
+
|
|
25
|
+
std::string loadBytesFromFile(const std::string &path) {
|
|
26
|
+
std::ifstream fs(path, std::ios::in | std::ios::binary);
|
|
27
|
+
if (fs.fail()) {
|
|
28
|
+
throw std::runtime_error("Failed to open tokenizer file");
|
|
29
|
+
}
|
|
30
|
+
std::string data;
|
|
31
|
+
fs.seekg(0, std::ios::end);
|
|
32
|
+
size_t size = static_cast<size_t>(fs.tellg());
|
|
33
|
+
fs.seekg(0, std::ios::beg);
|
|
34
|
+
data.resize(size);
|
|
35
|
+
fs.read(data.data(), size);
|
|
36
|
+
return data;
|
|
37
|
+
}
|
|
38
|
+
|
|
39
|
+
namespace {
|
|
40
|
+
static constexpr auto kEnableDynamicShape = "enable_dynamic_shape";
|
|
41
|
+
static constexpr auto kEosIds = "get_eos_ids";
|
|
42
|
+
static constexpr auto kMaxSeqLen = "get_max_seq_len";
|
|
43
|
+
static constexpr auto kMaxContextLen = "get_max_context_len";
|
|
44
|
+
static constexpr auto kVocabSize = "get_vocab_size";
|
|
45
|
+
static constexpr auto kUseKVCache = "use_kv_cache";
|
|
46
|
+
static constexpr auto kUseSDPAWithKVCache = "use_sdpa_with_kv_cache";
|
|
47
|
+
} // namespace
|
|
48
|
+
|
|
49
|
+
Runner::Runner(Module *module, const std::string &tokenizer_path,
|
|
50
|
+
const llm::GenerationConfig &config)
|
|
51
|
+
: config_(config), module_(module), tokenizer_path_(tokenizer_path),
|
|
52
|
+
metadata_({
|
|
53
|
+
{kEnableDynamicShape, false},
|
|
54
|
+
{kMaxSeqLen, 128},
|
|
55
|
+
{kMaxContextLen, 128},
|
|
56
|
+
{kUseKVCache, true},
|
|
57
|
+
{kUseSDPAWithKVCache, false},
|
|
58
|
+
}) {}
|
|
59
|
+
|
|
60
|
+
bool Runner::is_loaded() const {
|
|
61
|
+
return module_->is_loaded() && tokenizer_ && text_decoder_runner_ &&
|
|
62
|
+
text_prefiller_ && text_token_generator_;
|
|
63
|
+
}
|
|
64
|
+
|
|
65
|
+
Error Runner::load() {
|
|
66
|
+
if (is_loaded()) {
|
|
67
|
+
return Error::Ok;
|
|
68
|
+
}
|
|
69
|
+
|
|
70
|
+
ET_CHECK_OK_OR_RETURN_ERROR(module_->load_method("forward"));
|
|
71
|
+
|
|
72
|
+
// Load tokenizer.
|
|
73
|
+
auto blob = loadBytesFromFile(tokenizer_path_);
|
|
74
|
+
tokenizer_ = tokenizers::Tokenizer::FromBlobJSON(blob);
|
|
75
|
+
|
|
76
|
+
ET_LOG(Info, "Reading metadata from model");
|
|
77
|
+
|
|
78
|
+
auto eos_ids = std::make_unique<std::unordered_set<uint64_t>>();
|
|
79
|
+
metadata_[kVocabSize] = tokenizer_->GetVocabSize();
|
|
80
|
+
|
|
81
|
+
// Load model metadata
|
|
82
|
+
const auto method_names =
|
|
83
|
+
ET_UNWRAP(module_->method_names(), "Failed reading method names");
|
|
84
|
+
for (auto &pair : metadata_) {
|
|
85
|
+
const auto &method_name = pair.first;
|
|
86
|
+
auto &value = pair.second;
|
|
87
|
+
if (method_names.count(method_name)) {
|
|
88
|
+
value = ET_UNWRAP(module_->get(method_name))
|
|
89
|
+
.toScalar()
|
|
90
|
+
.to<decltype(metadata_)::mapped_type>();
|
|
91
|
+
} else {
|
|
92
|
+
ET_LOG(Info, "Method %s not found, using the default value %" PRId64,
|
|
93
|
+
method_name.c_str(), value);
|
|
94
|
+
}
|
|
95
|
+
ET_LOG(Info, "Metadata: %s = %" PRId64, method_name.c_str(), value);
|
|
96
|
+
}
|
|
97
|
+
|
|
98
|
+
// Load EOS token ids
|
|
99
|
+
if (method_names.count(kEosIds)) {
|
|
100
|
+
eos_ids->clear();
|
|
101
|
+
for (const auto &eos_id : ET_UNWRAP(module_->execute(kEosIds))) {
|
|
102
|
+
auto value = eos_id.toScalar().to<int64_t>();
|
|
103
|
+
eos_ids->emplace(value);
|
|
104
|
+
ET_LOG(Info, "eos_id = %" PRId64, value);
|
|
105
|
+
}
|
|
106
|
+
}
|
|
107
|
+
|
|
108
|
+
// Determine missing config values
|
|
109
|
+
// If user does not directly specify configuration parameters such as
|
|
110
|
+
// max_seq_len (i.e. leaves them as default values), they are determined by
|
|
111
|
+
// reading the exported model's methods.
|
|
112
|
+
if (config_.max_seq_len < 0)
|
|
113
|
+
config_.max_seq_len = static_cast<int32_t>(metadata_.at(kMaxSeqLen));
|
|
114
|
+
if (config_.max_context_length < 0)
|
|
115
|
+
config_.max_context_length =
|
|
116
|
+
static_cast<int32_t>(metadata_.at(kMaxContextLen));
|
|
117
|
+
if (config_.max_new_tokens < 0)
|
|
118
|
+
config_.max_new_tokens =
|
|
119
|
+
std::min(config_.max_seq_len, config_.max_context_length);
|
|
120
|
+
if (config_.enable_dynamic_shape)
|
|
121
|
+
config_.enable_dynamic_shape =
|
|
122
|
+
static_cast<bool>(metadata_.at(kEnableDynamicShape));
|
|
123
|
+
if (config_.enable_kv_cache)
|
|
124
|
+
config_.enable_kv_cache = static_cast<bool>(metadata_.at(kUseKVCache));
|
|
125
|
+
|
|
126
|
+
io_manager_ = std::make_unique<llm::IOManager>(*module_);
|
|
127
|
+
text_decoder_runner_ = std::make_unique<llm::TextDecoderRunner>(
|
|
128
|
+
module_, io_manager_.get(), config_.temperature, config_.topp);
|
|
129
|
+
text_prefiller_ = std::make_unique<llm::TextPrefiller>(
|
|
130
|
+
text_decoder_runner_.get(), config_.enable_kv_cache,
|
|
131
|
+
config_.enable_dynamic_shape, config_.max_seq_len);
|
|
132
|
+
|
|
133
|
+
text_token_generator_ = std::make_unique<llm::TextTokenGenerator>(
|
|
134
|
+
tokenizer_.get(), text_decoder_runner_.get(), config_.enable_kv_cache,
|
|
135
|
+
std::move(eos_ids), &stats_);
|
|
136
|
+
|
|
137
|
+
return Error::Ok;
|
|
138
|
+
}
|
|
139
|
+
|
|
140
|
+
// Don't print with the same priority during warmup
|
|
141
|
+
#define RUNNER_ET_LOG(warmup, format, ...) \
|
|
142
|
+
if (warmup) { \
|
|
143
|
+
ET_LOG(Debug, format, __VA_ARGS__); \
|
|
144
|
+
} else { \
|
|
145
|
+
ET_LOG(Info, format, __VA_ARGS__); \
|
|
146
|
+
}
|
|
147
|
+
|
|
148
|
+
Error Runner::generate(const std::string &prompt,
|
|
149
|
+
const llm::GenerationConfig &generation_config,
|
|
150
|
+
std::function<void(const std::string &)> token_callback,
|
|
151
|
+
std::function<void(const llm::Stats &)> stats_callback) {
|
|
152
|
+
// Prepare the inputs.
|
|
153
|
+
// Use ones-initialized inputs.
|
|
154
|
+
ET_CHECK_MSG(!prompt.empty(), "Prompt cannot be null");
|
|
155
|
+
if (!is_loaded()) {
|
|
156
|
+
stats_.model_load_start_ms = llm::time_in_ms();
|
|
157
|
+
ET_CHECK_OK_OR_RETURN_ERROR(load());
|
|
158
|
+
stats_.model_load_end_ms = llm::time_in_ms();
|
|
159
|
+
}
|
|
160
|
+
|
|
161
|
+
if (generation_config.warming) {
|
|
162
|
+
ET_LOG(Info, "Doing a warmup run...");
|
|
163
|
+
}
|
|
164
|
+
|
|
165
|
+
RUNNER_ET_LOG(generation_config.warming,
|
|
166
|
+
"RSS after loading model: %f MiB (0 if unsupported)",
|
|
167
|
+
llm::get_rss_bytes() / 1024.0 / 1024.0);
|
|
168
|
+
|
|
169
|
+
// Wrap the token_callback with print function
|
|
170
|
+
std::function<void(const std::string &)> wrapped_callback =
|
|
171
|
+
[token_callback, &generation_config](const std::string &piece) {
|
|
172
|
+
if (!generation_config.warming) {
|
|
173
|
+
llm::safe_printf(piece.c_str());
|
|
174
|
+
fflush(stdout);
|
|
175
|
+
}
|
|
176
|
+
if (token_callback) {
|
|
177
|
+
token_callback(piece);
|
|
178
|
+
}
|
|
179
|
+
};
|
|
180
|
+
// First token time only measures the time it takes to encode the prompt and
|
|
181
|
+
// return a response token.
|
|
182
|
+
|
|
183
|
+
stats_.inference_start_ms = llm::time_in_ms();
|
|
184
|
+
shouldStop_ = false;
|
|
185
|
+
|
|
186
|
+
// Override main config fields with given generation config if specified
|
|
187
|
+
int32_t max_seq_len = generation_config.max_seq_len >= 0
|
|
188
|
+
? generation_config.max_seq_len
|
|
189
|
+
: config_.max_seq_len;
|
|
190
|
+
int32_t max_context_length = generation_config.max_context_length >= 0
|
|
191
|
+
? generation_config.max_context_length
|
|
192
|
+
: config_.max_context_length;
|
|
193
|
+
int32_t new_tokens_limit = generation_config.max_new_tokens >= 0
|
|
194
|
+
? generation_config.max_new_tokens
|
|
195
|
+
: config_.max_new_tokens;
|
|
196
|
+
float temperature = generation_config.temperature >= 0.F
|
|
197
|
+
? generation_config.temperature
|
|
198
|
+
: config_.temperature;
|
|
199
|
+
float topp =
|
|
200
|
+
generation_config.topp >= 0.F ? generation_config.topp : config_.topp;
|
|
201
|
+
|
|
202
|
+
int64_t context_len_left = static_cast<int64_t>(max_context_length) - pos_;
|
|
203
|
+
|
|
204
|
+
std::vector<int32_t> prompt_tokens = tokenizer_->Encode(prompt);
|
|
205
|
+
std::vector<uint64_t> prompt_tokens_uint64(prompt_tokens.begin(),
|
|
206
|
+
prompt_tokens.end());
|
|
207
|
+
|
|
208
|
+
// encode the (string) prompt into tokens sequence
|
|
209
|
+
int num_prompt_tokens = prompt_tokens.size();
|
|
210
|
+
|
|
211
|
+
ET_CHECK_OR_RETURN_ERROR(num_prompt_tokens >= 1, InvalidArgument,
|
|
212
|
+
"Expected at least 1 prompt token");
|
|
213
|
+
ET_CHECK_OR_RETURN_ERROR(num_prompt_tokens < max_seq_len, InvalidArgument,
|
|
214
|
+
"num_prompt_tokens %d >= max_context_len %" PRId32
|
|
215
|
+
", Max seq length exceeded - please increase max "
|
|
216
|
+
"seq len value in your export script",
|
|
217
|
+
num_prompt_tokens, max_seq_len);
|
|
218
|
+
|
|
219
|
+
// Determine max_new_tokens using the GenerationConfig's resolve method,
|
|
220
|
+
// then subtract pos_ for max_new_tokens.
|
|
221
|
+
int32_t max_new_tokens = resolve_max_new_tokens(
|
|
222
|
+
num_prompt_tokens, max_seq_len, static_cast<int32_t>(context_len_left),
|
|
223
|
+
new_tokens_limit);
|
|
224
|
+
|
|
225
|
+
ET_LOG(Info,
|
|
226
|
+
"Max new tokens resolved: %d, given pos_ %" PRId64
|
|
227
|
+
", num_prompt_tokens %zu, max_context_len %" PRId64,
|
|
228
|
+
max_new_tokens, pos_, prompt_tokens.size(),
|
|
229
|
+
static_cast<int64_t>(max_context_length));
|
|
230
|
+
ET_CHECK_OR_RETURN_ERROR(max_new_tokens > 0, InvalidArgument,
|
|
231
|
+
"Max new tokens %d is less than or equal to 0",
|
|
232
|
+
max_new_tokens);
|
|
233
|
+
|
|
234
|
+
// Prefill first
|
|
235
|
+
// Here feed all tokens to the model and get the next predicted token
|
|
236
|
+
// after the prompt. After that we will enter generate loop.
|
|
237
|
+
|
|
238
|
+
// print prompts
|
|
239
|
+
if (generation_config.echo) {
|
|
240
|
+
wrapped_callback(prompt);
|
|
241
|
+
}
|
|
242
|
+
auto prefill_res = text_prefiller_->prefill(prompt_tokens_uint64, pos_);
|
|
243
|
+
stats_.first_token_ms = llm::time_in_ms();
|
|
244
|
+
stats_.prompt_eval_end_ms = llm::time_in_ms();
|
|
245
|
+
ET_CHECK_OK_OR_RETURN_ERROR(prefill_res.error());
|
|
246
|
+
uint64_t cur_token = prefill_res.get();
|
|
247
|
+
|
|
248
|
+
// print the first token from prefill. No prev_token so use cur_token for it.
|
|
249
|
+
const std::string cur_decoded =
|
|
250
|
+
tokenizer_->Decode(std::vector<int32_t>{static_cast<int32_t>(cur_token)});
|
|
251
|
+
RUNNER_ET_LOG(generation_config.warming,
|
|
252
|
+
"RSS after prompt prefill: %f MiB (0 if unsupported)",
|
|
253
|
+
llm::get_rss_bytes() / 1024.0 / 1024.0);
|
|
254
|
+
|
|
255
|
+
// start the main loop
|
|
256
|
+
prompt_tokens_uint64.push_back(cur_token);
|
|
257
|
+
int64_t num_generated_tokens = ET_UNWRAP(text_token_generator_->generate(
|
|
258
|
+
prompt_tokens_uint64, pos_, max_new_tokens - 1, temperature, topp,
|
|
259
|
+
wrapped_callback));
|
|
260
|
+
|
|
261
|
+
pos_ += num_generated_tokens;
|
|
262
|
+
|
|
263
|
+
stats_.inference_end_ms = llm::time_in_ms();
|
|
264
|
+
if (!generation_config.warming) {
|
|
265
|
+
printf("\n");
|
|
266
|
+
}
|
|
267
|
+
RUNNER_ET_LOG(
|
|
268
|
+
generation_config.warming,
|
|
269
|
+
"RSS after finishing text generation: %f MiB (0 if unsupported)",
|
|
270
|
+
llm::get_rss_bytes() / 1024.0 / 1024.0);
|
|
271
|
+
|
|
272
|
+
if (num_generated_tokens == max_new_tokens) {
|
|
273
|
+
RUNNER_ET_LOG(generation_config.warming, "Max new tokens %i reached!",
|
|
274
|
+
max_new_tokens);
|
|
275
|
+
}
|
|
276
|
+
|
|
277
|
+
stats_.num_prompt_tokens = num_prompt_tokens;
|
|
278
|
+
stats_.num_generated_tokens = num_generated_tokens;
|
|
279
|
+
|
|
280
|
+
if (generation_config.warming) {
|
|
281
|
+
ET_LOG(Info, "Warmup run finished!");
|
|
282
|
+
} else {
|
|
283
|
+
// Do not print report during warmup
|
|
284
|
+
::executorch::llm::print_report(stats_);
|
|
285
|
+
}
|
|
286
|
+
if (stats_callback) {
|
|
287
|
+
stats_callback(stats_);
|
|
288
|
+
}
|
|
289
|
+
|
|
290
|
+
return Error::Ok;
|
|
291
|
+
}
|
|
292
|
+
|
|
293
|
+
Error Runner::warmup(const std::string &prompt) {
|
|
294
|
+
// Create a GenerationConfig for warmup
|
|
295
|
+
llm::GenerationConfig config{.echo = false, .warming = true};
|
|
296
|
+
|
|
297
|
+
// Call generate with the warmup config
|
|
298
|
+
Error err = generate(prompt, config,
|
|
299
|
+
/*token_callback=*/nullptr,
|
|
300
|
+
/*stats_callbak=*/nullptr);
|
|
301
|
+
|
|
302
|
+
// Reset stats after warmup
|
|
303
|
+
reset();
|
|
304
|
+
|
|
305
|
+
return err;
|
|
306
|
+
}
|
|
307
|
+
|
|
308
|
+
void Runner::stop() {
|
|
309
|
+
if (is_loaded()) {
|
|
310
|
+
text_token_generator_->stop();
|
|
311
|
+
} else {
|
|
312
|
+
ET_LOG(Error, "Token generator is not loaded, cannot stop");
|
|
313
|
+
}
|
|
314
|
+
}
|
|
315
|
+
|
|
316
|
+
void Runner::reset() {
|
|
317
|
+
stats_.reset();
|
|
318
|
+
pos_ = 0;
|
|
319
|
+
}
|
|
320
|
+
|
|
321
|
+
void Runner::set_count_interval(size_t count_interval) {
|
|
322
|
+
text_token_generator_->set_count_interval(count_interval);
|
|
323
|
+
}
|
|
324
|
+
|
|
325
|
+
void Runner::set_time_interval(size_t time_interval) {
|
|
326
|
+
text_token_generator_->set_time_interval(time_interval);
|
|
327
|
+
}
|
|
328
|
+
|
|
329
|
+
void Runner::set_temperature(float temperature) noexcept {
|
|
330
|
+
config_.temperature = temperature;
|
|
331
|
+
if (text_decoder_runner_) {
|
|
332
|
+
text_decoder_runner_->set_temperature(temperature);
|
|
333
|
+
}
|
|
334
|
+
}
|
|
335
|
+
|
|
336
|
+
void Runner::set_topp(float topp) noexcept {
|
|
337
|
+
config_.topp = topp;
|
|
338
|
+
if (text_decoder_runner_) {
|
|
339
|
+
text_decoder_runner_->set_topp(topp);
|
|
340
|
+
}
|
|
341
|
+
}
|
|
342
|
+
|
|
343
|
+
int32_t Runner::resolve_max_new_tokens(int32_t num_prompt_tokens,
|
|
344
|
+
int32_t max_seq_len,
|
|
345
|
+
int32_t max_context_len,
|
|
346
|
+
int32_t max_new_tokens) const {
|
|
347
|
+
int32_t result;
|
|
348
|
+
|
|
349
|
+
if (max_seq_len == -1 && max_new_tokens == -1) {
|
|
350
|
+
// Both are -1, use max context len minus prompt tokens
|
|
351
|
+
result = max_context_len - num_prompt_tokens;
|
|
352
|
+
} else if (max_seq_len == -1 && max_new_tokens != -1) {
|
|
353
|
+
// Only max_new_tokens is specified
|
|
354
|
+
result = std::min(max_new_tokens, max_context_len - num_prompt_tokens);
|
|
355
|
+
} else if (max_seq_len != -1 && max_new_tokens == -1) {
|
|
356
|
+
// Only seq_len is specified
|
|
357
|
+
result = std::min(max_seq_len, max_context_len) - num_prompt_tokens;
|
|
358
|
+
} else {
|
|
359
|
+
// Both are specified
|
|
360
|
+
result =
|
|
361
|
+
std::min(std::min(max_seq_len, max_context_len) - num_prompt_tokens,
|
|
362
|
+
max_new_tokens);
|
|
363
|
+
}
|
|
364
|
+
|
|
365
|
+
// Ensure result is not negative
|
|
366
|
+
return std::max(0, result);
|
|
367
|
+
}
|
|
368
|
+
|
|
369
|
+
} // namespace example
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
/*
|
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
3
|
+
* All rights reserved.
|
|
4
|
+
*
|
|
5
|
+
* This source code is licensed under the BSD-style license found in the
|
|
6
|
+
* LICENSE file in the root directory of this source tree.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
// A simple llama2 runner that includes preprocessing and post processing logic.
|
|
10
|
+
// The module takes in a string as input and emits a string as output.
|
|
11
|
+
|
|
12
|
+
#pragma once
|
|
13
|
+
|
|
14
|
+
#include "irunner.h"
|
|
15
|
+
#include "stats.h"
|
|
16
|
+
#include "text_decoder_runner.h"
|
|
17
|
+
#include "text_prefiller.h"
|
|
18
|
+
#include "text_token_generator.h"
|
|
19
|
+
#include <cstdint>
|
|
20
|
+
#include <executorch/extension/module/module.h>
|
|
21
|
+
#include <functional>
|
|
22
|
+
#include <memory>
|
|
23
|
+
#include <optional>
|
|
24
|
+
#include <string>
|
|
25
|
+
#include <tokenizers-cpp/tokenizers_cpp.h>
|
|
26
|
+
#include <unordered_map>
|
|
27
|
+
|
|
28
|
+
namespace example {
|
|
29
|
+
|
|
30
|
+
namespace llm = ::executorch::extension::llm;
|
|
31
|
+
|
|
32
|
+
class Runner : public llm::IRunner {
|
|
33
|
+
public:
|
|
34
|
+
explicit Runner(::executorch::extension::Module *module,
|
|
35
|
+
const std::string &tokenizer_path,
|
|
36
|
+
const llm::GenerationConfig &config = {
|
|
37
|
+
.temperature = 0.8F, .topp = 0.9F}); // The main config
|
|
38
|
+
|
|
39
|
+
bool is_loaded() const override;
|
|
40
|
+
::executorch::runtime::Error load() override;
|
|
41
|
+
::executorch::runtime::Error generate(
|
|
42
|
+
const std::string &prompt,
|
|
43
|
+
const llm::GenerationConfig &generation_config =
|
|
44
|
+
{}, // An extra config which temporarily overrides previous model
|
|
45
|
+
// settings
|
|
46
|
+
std::function<void(const std::string &)> token_callback = {},
|
|
47
|
+
std::function<void(const llm::Stats &)> stats_callback = {}) override;
|
|
48
|
+
::executorch::runtime::Error warmup(const std::string &prompt);
|
|
49
|
+
void set_count_interval(size_t count_interval);
|
|
50
|
+
void set_time_interval(size_t time_interval);
|
|
51
|
+
void set_temperature(float temperature) noexcept;
|
|
52
|
+
void set_topp(float topp) noexcept;
|
|
53
|
+
|
|
54
|
+
void stop() override;
|
|
55
|
+
void reset() override;
|
|
56
|
+
|
|
57
|
+
llm::Stats stats_;
|
|
58
|
+
|
|
59
|
+
private:
|
|
60
|
+
// Helper functions
|
|
61
|
+
int32_t resolve_max_new_tokens(int32_t num_prompt_tokens, int32_t max_seq_len,
|
|
62
|
+
int32_t max_context_len,
|
|
63
|
+
int32_t max_new_tokens = -1) const;
|
|
64
|
+
|
|
65
|
+
// Main config
|
|
66
|
+
llm::GenerationConfig config_;
|
|
67
|
+
|
|
68
|
+
// Flow control
|
|
69
|
+
bool shouldStop_{false};
|
|
70
|
+
int64_t pos_ = 0; // The position in KV cache of the input, starting from 0.
|
|
71
|
+
|
|
72
|
+
// Main model
|
|
73
|
+
::executorch::extension::Module *module_;
|
|
74
|
+
|
|
75
|
+
// Subcomponents
|
|
76
|
+
std::string tokenizer_path_;
|
|
77
|
+
std::unique_ptr<tokenizers::Tokenizer> tokenizer_;
|
|
78
|
+
std::unordered_map<std::string, int64_t> metadata_;
|
|
79
|
+
std::unique_ptr<llm::IOManager> io_manager_;
|
|
80
|
+
std::unique_ptr<llm::TextDecoderRunner> text_decoder_runner_;
|
|
81
|
+
std::unique_ptr<llm::TextPrefiller> text_prefiller_;
|
|
82
|
+
std::unique_ptr<llm::TextTokenGenerator> text_token_generator_;
|
|
83
|
+
};
|
|
84
|
+
|
|
85
|
+
} // namespace example
|
|
@@ -0,0 +1,201 @@
|
|
|
1
|
+
/*
|
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
|
3
|
+
* All rights reserved.
|
|
4
|
+
*
|
|
5
|
+
* This source code is licensed under the BSD-style license found in the
|
|
6
|
+
* LICENSE file in the root directory of this source tree.
|
|
7
|
+
*/
|
|
8
|
+
|
|
9
|
+
// This is a modified version of https://github.com/karpathy/llama2.c.git
|
|
10
|
+
// @lint-ignore-every LICENSELINT
|
|
11
|
+
/**
|
|
12
|
+
* MIT License
|
|
13
|
+
*
|
|
14
|
+
* Copyright (c) 2023 Andrej
|
|
15
|
+
*
|
|
16
|
+
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
17
|
+
* of this software and associated documentation files (the "Software"), to deal
|
|
18
|
+
* in the Software without restriction, including without limitation the rights
|
|
19
|
+
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
20
|
+
* copies of the Software, and to permit persons to whom the Software is
|
|
21
|
+
* furnished to do so, subject to the following conditions:
|
|
22
|
+
*
|
|
23
|
+
* The above copyright notice and this permission notice shall be included in
|
|
24
|
+
* all copies or substantial portions of the Software.
|
|
25
|
+
*
|
|
26
|
+
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
27
|
+
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
28
|
+
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
29
|
+
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
30
|
+
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
31
|
+
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
32
|
+
* SOFTWARE.
|
|
33
|
+
*/
|
|
34
|
+
|
|
35
|
+
#include "sampler.h"
|
|
36
|
+
#include <algorithm>
|
|
37
|
+
#include <ctime>
|
|
38
|
+
|
|
39
|
+
namespace executorch {
|
|
40
|
+
namespace extension {
|
|
41
|
+
namespace llm {
|
|
42
|
+
|
|
43
|
+
// sampler stuff
|
|
44
|
+
template <typename T> int32_t Sampler::sample_argmax(T *probabilities) {
|
|
45
|
+
// return the index that has the highest probability
|
|
46
|
+
int max_i = 0;
|
|
47
|
+
T max_p = probabilities[0];
|
|
48
|
+
for (int i = 1; i < vocab_size_; i++) {
|
|
49
|
+
if (probabilities[i] > max_p) {
|
|
50
|
+
max_i = i;
|
|
51
|
+
max_p = probabilities[i];
|
|
52
|
+
}
|
|
53
|
+
}
|
|
54
|
+
return max_i;
|
|
55
|
+
}
|
|
56
|
+
|
|
57
|
+
template <typename T>
|
|
58
|
+
int32_t Sampler::sample_mult(T *probabilities, float coin) {
|
|
59
|
+
// sample index from probabilities (they must sum to 1!)
|
|
60
|
+
// coin is a random number in [0, 1), usually from random_f32()
|
|
61
|
+
T cdf = 0.0;
|
|
62
|
+
for (int i = 0; i < vocab_size_; i++) {
|
|
63
|
+
cdf += probabilities[i];
|
|
64
|
+
if (coin < cdf) {
|
|
65
|
+
return i;
|
|
66
|
+
}
|
|
67
|
+
}
|
|
68
|
+
return vocab_size_ - 1; // in case of rounding errors
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
template <typename T>
|
|
72
|
+
int32_t Sampler::sample_topp(T *probabilities, float coin) {
|
|
73
|
+
// top-p sampling (or "nucleus sampling") samples from the smallest set of
|
|
74
|
+
// tokens that exceed probability topp. This way we never sample tokens that
|
|
75
|
+
// have very low probabilities and are less likely to go "off the rails".
|
|
76
|
+
// coin is a random number in [0, 1), usually from random_f32()
|
|
77
|
+
int n = vocab_size_;
|
|
78
|
+
int n0 = 0;
|
|
79
|
+
// quicksort indices in descending order of probabilities
|
|
80
|
+
// values smaller than (1 - topp) / (n - 1) cannot be part of the result
|
|
81
|
+
// so for efficiency we crop these out as candidates before sorting
|
|
82
|
+
std::unique_ptr<ProbIndex<T>[]> probindex =
|
|
83
|
+
std::make_unique<ProbIndex<T>[]>(vocab_size_);
|
|
84
|
+
|
|
85
|
+
const float cutoff = (1.0f - topp_) / (n - 1);
|
|
86
|
+
for (int i = 0; i < n; i++) {
|
|
87
|
+
if (probabilities[i] >= cutoff) {
|
|
88
|
+
probindex[n0].index = i;
|
|
89
|
+
probindex[n0].prob = probabilities[i];
|
|
90
|
+
n0++;
|
|
91
|
+
}
|
|
92
|
+
}
|
|
93
|
+
|
|
94
|
+
auto compare = [](const ProbIndex<T> &a, const ProbIndex<T> &b) {
|
|
95
|
+
return a.prob > b.prob;
|
|
96
|
+
};
|
|
97
|
+
std::sort(probindex.get(), probindex.get() + n0, compare);
|
|
98
|
+
|
|
99
|
+
// truncate the list where cumulative probability exceeds topp
|
|
100
|
+
T cumulative_prob = 0;
|
|
101
|
+
int last_idx = n0 - 1; // in case of rounding errors consider all elements
|
|
102
|
+
for (int i = 0; i < n0; i++) {
|
|
103
|
+
cumulative_prob += probindex[i].prob;
|
|
104
|
+
if (cumulative_prob > topp_) {
|
|
105
|
+
last_idx = i;
|
|
106
|
+
break; // we've exceeded topp by including last_idx
|
|
107
|
+
}
|
|
108
|
+
}
|
|
109
|
+
|
|
110
|
+
// sample from the truncated list
|
|
111
|
+
const T &r = coin * cumulative_prob;
|
|
112
|
+
T cdf = 0;
|
|
113
|
+
for (int i = 0; i <= last_idx; i++) {
|
|
114
|
+
cdf += probindex[i].prob;
|
|
115
|
+
if (r < cdf) {
|
|
116
|
+
return probindex[i].index;
|
|
117
|
+
}
|
|
118
|
+
}
|
|
119
|
+
return probindex[last_idx].index; // in case of rounding errors
|
|
120
|
+
}
|
|
121
|
+
|
|
122
|
+
Sampler::Sampler(int vocab_size, float temperature, float topp,
|
|
123
|
+
unsigned long long rng_seed)
|
|
124
|
+
: vocab_size_(vocab_size),
|
|
125
|
+
inv_temperature_((temperature != 0.0f) ? (1.0f / temperature) : 0.0f),
|
|
126
|
+
topp_(topp), rng_state_(rng_seed) {}
|
|
127
|
+
|
|
128
|
+
Sampler::Sampler(int vocab_size, float temperature, float topp)
|
|
129
|
+
: vocab_size_(vocab_size),
|
|
130
|
+
inv_temperature_((temperature != 0.0f) ? (1.0f / temperature) : 0.0f),
|
|
131
|
+
topp_(topp), rng_state_(std::time(nullptr)) {}
|
|
132
|
+
|
|
133
|
+
template <typename T> static void softmax(T *x, int size) {
|
|
134
|
+
// find max value (for numerical stability)
|
|
135
|
+
T max_val = x[0];
|
|
136
|
+
for (int i = 1; i < size; i++) {
|
|
137
|
+
if (x[i] > max_val) {
|
|
138
|
+
max_val = x[i];
|
|
139
|
+
}
|
|
140
|
+
}
|
|
141
|
+
// exp and sum
|
|
142
|
+
T sum = 0;
|
|
143
|
+
for (int i = 0; i < size; i++) {
|
|
144
|
+
x[i] = expf(x[i] - max_val);
|
|
145
|
+
sum += x[i];
|
|
146
|
+
}
|
|
147
|
+
// normalize
|
|
148
|
+
for (int i = 0; i < size; i++) {
|
|
149
|
+
x[i] /= sum;
|
|
150
|
+
}
|
|
151
|
+
}
|
|
152
|
+
|
|
153
|
+
static unsigned int random_u32(unsigned long long *state) {
|
|
154
|
+
// xorshift rng: https://en.wikipedia.org/wiki/Xorshift#xorshift.2A
|
|
155
|
+
*state ^= *state >> 12;
|
|
156
|
+
*state ^= *state << 25;
|
|
157
|
+
*state ^= *state >> 27;
|
|
158
|
+
return (*state * 0x2545F4914F6CDD1Dull) >> 32;
|
|
159
|
+
}
|
|
160
|
+
|
|
161
|
+
static float random_f32(unsigned long long *state) { // random float32 in [0,1)
|
|
162
|
+
return (random_u32(state) >> 8) / 16777216.0f;
|
|
163
|
+
}
|
|
164
|
+
|
|
165
|
+
template <typename T> int32_t Sampler::sample(T *logits) {
|
|
166
|
+
// sample the token given the logits and some hyperparameters
|
|
167
|
+
int next;
|
|
168
|
+
if (inv_temperature_ == 0.0f) {
|
|
169
|
+
// greedy argmax sampling: take the token with the highest probability
|
|
170
|
+
next = sample_argmax(logits);
|
|
171
|
+
} else {
|
|
172
|
+
// apply the temperature to the logits
|
|
173
|
+
for (int q = 0; q < vocab_size_; q++) {
|
|
174
|
+
logits[q] *= inv_temperature_;
|
|
175
|
+
}
|
|
176
|
+
// apply softmax to the logits to get the probabilities for next token
|
|
177
|
+
softmax(logits, vocab_size_);
|
|
178
|
+
// flip a (float) coin (this is our source of entropy for sampling)
|
|
179
|
+
float coin = random_f32(&rng_state_);
|
|
180
|
+
// we sample from this distribution to get the next token
|
|
181
|
+
if (topp_ <= 0 || topp_ >= 1) {
|
|
182
|
+
// simply sample from the predicted probability distribution
|
|
183
|
+
next = sample_mult(logits, coin);
|
|
184
|
+
} else {
|
|
185
|
+
// top-p (nucleus) sampling, clamping the least likely tokens to zero
|
|
186
|
+
next = sample_topp(logits, coin);
|
|
187
|
+
}
|
|
188
|
+
}
|
|
189
|
+
return next;
|
|
190
|
+
}
|
|
191
|
+
|
|
192
|
+
template int32_t Sampler::sample<float>(float *logits);
|
|
193
|
+
template int32_t Sampler::sample<uint16_t>(uint16_t *logits);
|
|
194
|
+
template int32_t
|
|
195
|
+
Sampler::sample<executorch::aten::Half>(executorch::aten::Half *logits);
|
|
196
|
+
template int32_t
|
|
197
|
+
Sampler::sample<executorch::aten::BFloat16>(executorch::aten::BFloat16 *logits);
|
|
198
|
+
|
|
199
|
+
} // namespace llm
|
|
200
|
+
} // namespace extension
|
|
201
|
+
} // namespace executorch
|