react-native-executorch 0.5.1-rc.0 → 0.5.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +132 -0
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.cpp +4 -10
- package/common/rnexecutorch/models/speech_to_text/SpeechToText.h +1 -1
- package/common/rnexecutorch/models/speech_to_text/SpeechToTextStrategy.h +3 -2
- package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.cpp +16 -4
- package/common/rnexecutorch/models/speech_to_text/WhisperStrategy.h +2 -2
- package/lib/Error.d.ts +30 -0
- package/lib/Error.js +50 -0
- package/lib/constants/directories.d.ts +1 -0
- package/lib/constants/directories.js +2 -0
- package/lib/constants/llmDefaults.d.ts +6 -0
- package/lib/constants/llmDefaults.js +16 -0
- package/lib/constants/modelUrls.d.ts +217 -83
- package/lib/constants/modelUrls.js +304 -98
- package/lib/constants/ocr/models.d.ts +882 -0
- package/lib/constants/ocr/models.js +182 -0
- package/lib/constants/ocr/symbols.d.ts +75 -0
- package/lib/constants/ocr/symbols.js +139 -0
- package/lib/{typescript/constants → constants}/sttDefaults.d.ts +0 -1
- package/lib/constants/sttDefaults.js +12 -10
- package/lib/controllers/LLMController.d.ts +47 -0
- package/lib/controllers/LLMController.js +14 -11
- package/lib/controllers/OCRController.d.ts +23 -0
- package/lib/controllers/OCRController.js +12 -5
- package/lib/controllers/SpeechToTextController.d.ts +8 -4
- package/lib/controllers/SpeechToTextController.js +15 -9
- package/lib/controllers/VerticalOCRController.d.ts +25 -0
- package/lib/controllers/VerticalOCRController.js +75 -0
- package/lib/hooks/computer_vision/useClassification.d.ts +15 -0
- package/lib/hooks/computer_vision/useClassification.js +7 -0
- package/lib/hooks/computer_vision/useImageEmbeddings.d.ts +15 -0
- package/lib/hooks/computer_vision/useImageEmbeddings.js +7 -0
- package/lib/hooks/computer_vision/useImageSegmentation.d.ts +38 -0
- package/lib/hooks/computer_vision/useImageSegmentation.js +7 -0
- package/lib/hooks/computer_vision/useOCR.d.ts +20 -0
- package/lib/hooks/computer_vision/useOCR.js +42 -0
- package/lib/hooks/computer_vision/useObjectDetection.d.ts +15 -0
- package/lib/hooks/computer_vision/useObjectDetection.js +7 -0
- package/lib/hooks/computer_vision/useStyleTransfer.d.ts +15 -0
- package/lib/hooks/computer_vision/useStyleTransfer.js +7 -0
- package/lib/hooks/computer_vision/useVerticalOCR.d.ts +21 -0
- package/lib/hooks/computer_vision/useVerticalOCR.js +45 -0
- package/lib/hooks/general/useExecutorchModule.d.ts +13 -0
- package/lib/hooks/general/useExecutorchModule.js +7 -0
- package/lib/hooks/natural_language_processing/useLLM.d.ts +10 -0
- package/lib/hooks/natural_language_processing/useLLM.js +78 -0
- package/lib/hooks/natural_language_processing/useSpeechToText.d.ts +27 -0
- package/lib/hooks/natural_language_processing/useSpeechToText.js +19 -14
- package/lib/hooks/natural_language_processing/useTextEmbeddings.d.ts +16 -0
- package/lib/hooks/natural_language_processing/useTextEmbeddings.js +7 -0
- package/lib/hooks/natural_language_processing/useTokenizer.d.ts +17 -0
- package/lib/hooks/natural_language_processing/useTokenizer.js +52 -0
- package/lib/hooks/useModule.d.ts +17 -0
- package/lib/hooks/useModule.js +45 -0
- package/lib/hooks/useNonStaticModule.d.ts +20 -0
- package/lib/hooks/useNonStaticModule.js +49 -0
- package/lib/index.d.ts +1 -1
- package/lib/index.js +3 -2
- package/lib/module/constants/modelUrls.js +61 -36
- package/lib/module/constants/modelUrls.js.map +1 -1
- package/lib/module/constants/ocr/models.js +1 -1
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js +71 -34
- package/lib/module/hooks/natural_language_processing/useSpeechToText.js.map +1 -1
- package/lib/module/index.js +2 -3
- package/lib/module/index.js.map +1 -1
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js +72 -31
- package/lib/module/modules/natural_language_processing/SpeechToTextModule.js.map +1 -1
- package/lib/module/types/stt.js +1 -85
- package/lib/module/types/stt.js.map +1 -1
- package/lib/module/utils/ResourceFetcher.js +6 -8
- package/lib/module/utils/ResourceFetcher.js.map +1 -1
- package/lib/module/utils/ResourceFetcherUtils.js +20 -20
- package/lib/module/utils/ResourceFetcherUtils.js.map +1 -1
- package/lib/module/utils/SpeechToTextModule/ASR.js +191 -0
- package/lib/module/utils/SpeechToTextModule/ASR.js.map +1 -0
- package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js +73 -0
- package/lib/module/utils/SpeechToTextModule/OnlineProcessor.js.map +1 -0
- package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js +56 -0
- package/lib/module/utils/SpeechToTextModule/hypothesisBuffer.js.map +1 -0
- package/lib/modules/BaseModule.d.ts +8 -0
- package/lib/modules/BaseModule.js +25 -0
- package/lib/modules/BaseNonStaticModule.d.ts +9 -0
- package/lib/modules/BaseNonStaticModule.js +14 -0
- package/lib/modules/computer_vision/ClassificationModule.d.ts +8 -0
- package/lib/modules/computer_vision/ClassificationModule.js +17 -0
- package/lib/modules/computer_vision/ImageEmbeddingsModule.d.ts +8 -0
- package/lib/modules/computer_vision/ImageEmbeddingsModule.js +17 -0
- package/lib/modules/computer_vision/ImageSegmentationModule.d.ts +11 -0
- package/lib/modules/computer_vision/ImageSegmentationModule.js +27 -0
- package/lib/modules/computer_vision/OCRModule.d.ts +15 -0
- package/lib/modules/computer_vision/OCRModule.js +20 -0
- package/lib/modules/computer_vision/ObjectDetectionModule.d.ts +9 -0
- package/lib/modules/computer_vision/ObjectDetectionModule.js +17 -0
- package/lib/modules/computer_vision/StyleTransferModule.d.ts +8 -0
- package/lib/modules/computer_vision/StyleTransferModule.js +17 -0
- package/lib/modules/computer_vision/VerticalOCRModule.d.ts +15 -0
- package/lib/modules/computer_vision/VerticalOCRModule.js +22 -0
- package/lib/modules/general/ExecutorchModule.d.ts +7 -0
- package/lib/modules/general/ExecutorchModule.js +14 -0
- package/lib/modules/natural_language_processing/LLMModule.d.ts +28 -0
- package/lib/modules/natural_language_processing/LLMModule.js +45 -0
- package/lib/modules/natural_language_processing/SpeechToTextModule.d.ts +18 -8
- package/lib/modules/natural_language_processing/SpeechToTextModule.js +21 -15
- package/lib/modules/natural_language_processing/TextEmbeddingsModule.d.ts +9 -0
- package/lib/modules/natural_language_processing/TextEmbeddingsModule.js +21 -0
- package/lib/modules/natural_language_processing/TokenizerModule.d.ts +12 -0
- package/lib/modules/natural_language_processing/TokenizerModule.js +5 -4
- package/lib/native/NativeETInstaller.d.ts +6 -0
- package/lib/native/NativeETInstaller.js +2 -0
- package/lib/native/NativeOCR.d.ts +8 -0
- package/lib/native/NativeOCR.js +2 -0
- package/lib/native/NativeVerticalOCR.d.ts +8 -0
- package/lib/native/NativeVerticalOCR.js +2 -0
- package/lib/types/common.d.ts +31 -0
- package/lib/types/common.js +25 -0
- package/lib/types/imageSegmentation.d.ts +24 -0
- package/lib/types/imageSegmentation.js +26 -0
- package/lib/types/llm.d.ts +46 -0
- package/lib/types/llm.js +9 -0
- package/lib/types/objectDetection.d.ts +104 -0
- package/lib/types/objectDetection.js +94 -0
- package/lib/types/ocr.d.ts +11 -0
- package/lib/types/ocr.js +1 -0
- package/lib/types/stt.d.ts +94 -0
- package/lib/types/stt.js +85 -0
- package/lib/typescript/constants/modelUrls.d.ts +24 -7
- package/lib/typescript/constants/modelUrls.d.ts.map +1 -1
- package/lib/typescript/constants/ocr/models.d.ts +126 -126
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts +15 -24
- package/lib/typescript/hooks/natural_language_processing/useSpeechToText.d.ts.map +1 -1
- package/lib/typescript/index.d.ts +2 -3
- package/lib/typescript/index.d.ts.map +1 -1
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts +19 -22
- package/lib/typescript/modules/natural_language_processing/SpeechToTextModule.d.ts.map +1 -1
- package/lib/typescript/types/stt.d.ts +17 -91
- package/lib/typescript/types/stt.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcher.d.ts.map +1 -1
- package/lib/typescript/utils/ResourceFetcherUtils.d.ts.map +1 -1
- package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts +27 -0
- package/lib/typescript/utils/SpeechToTextModule/ASR.d.ts.map +1 -0
- package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts +23 -0
- package/lib/typescript/utils/SpeechToTextModule/OnlineProcessor.d.ts.map +1 -0
- package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts +13 -0
- package/lib/typescript/utils/SpeechToTextModule/hypothesisBuffer.d.ts.map +1 -0
- package/lib/utils/ResourceFetcher.d.ts +24 -0
- package/lib/utils/ResourceFetcher.js +305 -0
- package/lib/utils/ResourceFetcherUtils.d.ts +54 -0
- package/lib/utils/ResourceFetcherUtils.js +9 -0
- package/lib/utils/llm.d.ts +6 -0
- package/lib/utils/llm.js +1 -0
- package/lib/utils/stt.d.ts +1 -0
- package/lib/utils/stt.js +21 -0
- package/package.json +5 -3
- package/src/constants/modelUrls.ts +70 -37
- package/src/constants/ocr/models.ts +1 -1
- package/src/hooks/natural_language_processing/useSpeechToText.ts +87 -92
- package/src/index.ts +6 -8
- package/src/modules/natural_language_processing/SpeechToTextModule.ts +81 -69
- package/src/types/stt.ts +97 -92
- package/src/utils/ResourceFetcher.ts +9 -7
- package/src/utils/ResourceFetcherUtils.ts +15 -17
- package/src/utils/SpeechToTextModule/ASR.ts +303 -0
- package/src/utils/SpeechToTextModule/OnlineProcessor.ts +87 -0
- package/src/utils/SpeechToTextModule/hypothesisBuffer.ts +79 -0
- package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.cpp +0 -31
- package/common/rnexecutorch/models/speech_to_text/MoonshineStrategy.h +0 -21
- package/lib/module/constants/sttDefaults.js +0 -74
- package/lib/module/constants/sttDefaults.js.map +0 -1
- package/lib/module/controllers/SpeechToTextController.js +0 -320
- package/lib/module/controllers/SpeechToTextController.js.map +0 -1
- package/lib/typescript/constants/sttDefaults.d.ts.map +0 -1
- package/lib/typescript/controllers/SpeechToTextController.d.ts +0 -57
- package/lib/typescript/controllers/SpeechToTextController.d.ts.map +0 -1
- package/src/constants/sttDefaults.ts +0 -82
- package/src/controllers/SpeechToTextController.ts +0 -471
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/contents.xcworkspacedata +0 -7
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/project.xcworkspace/xcuserdata/norbertklockiewicz.xcuserdatad/UserInterfaceState.xcuserstate +0 -0
- package/third-party/ios/ExecutorchLib/ExecutorchLib.xcodeproj/xcuserdata/norbertklockiewicz.xcuserdatad/xcschemes/xcschememanagement.plist +0 -14
|
@@ -0,0 +1,94 @@
|
|
|
1
|
+
var CocoLabel;
|
|
2
|
+
(function (CocoLabel) {
|
|
3
|
+
CocoLabel[CocoLabel["PERSON"] = 1] = "PERSON";
|
|
4
|
+
CocoLabel[CocoLabel["BICYCLE"] = 2] = "BICYCLE";
|
|
5
|
+
CocoLabel[CocoLabel["CAR"] = 3] = "CAR";
|
|
6
|
+
CocoLabel[CocoLabel["MOTORCYCLE"] = 4] = "MOTORCYCLE";
|
|
7
|
+
CocoLabel[CocoLabel["AIRPLANE"] = 5] = "AIRPLANE";
|
|
8
|
+
CocoLabel[CocoLabel["BUS"] = 6] = "BUS";
|
|
9
|
+
CocoLabel[CocoLabel["TRAIN"] = 7] = "TRAIN";
|
|
10
|
+
CocoLabel[CocoLabel["TRUCK"] = 8] = "TRUCK";
|
|
11
|
+
CocoLabel[CocoLabel["BOAT"] = 9] = "BOAT";
|
|
12
|
+
CocoLabel[CocoLabel["TRAFFIC_LIGHT"] = 10] = "TRAFFIC_LIGHT";
|
|
13
|
+
CocoLabel[CocoLabel["FIRE_HYDRANT"] = 11] = "FIRE_HYDRANT";
|
|
14
|
+
CocoLabel[CocoLabel["STREET_SIGN"] = 12] = "STREET_SIGN";
|
|
15
|
+
CocoLabel[CocoLabel["STOP_SIGN"] = 13] = "STOP_SIGN";
|
|
16
|
+
CocoLabel[CocoLabel["PARKING"] = 14] = "PARKING";
|
|
17
|
+
CocoLabel[CocoLabel["BENCH"] = 15] = "BENCH";
|
|
18
|
+
CocoLabel[CocoLabel["BIRD"] = 16] = "BIRD";
|
|
19
|
+
CocoLabel[CocoLabel["CAT"] = 17] = "CAT";
|
|
20
|
+
CocoLabel[CocoLabel["DOG"] = 18] = "DOG";
|
|
21
|
+
CocoLabel[CocoLabel["HORSE"] = 19] = "HORSE";
|
|
22
|
+
CocoLabel[CocoLabel["SHEEP"] = 20] = "SHEEP";
|
|
23
|
+
CocoLabel[CocoLabel["COW"] = 21] = "COW";
|
|
24
|
+
CocoLabel[CocoLabel["ELEPHANT"] = 22] = "ELEPHANT";
|
|
25
|
+
CocoLabel[CocoLabel["BEAR"] = 23] = "BEAR";
|
|
26
|
+
CocoLabel[CocoLabel["ZEBRA"] = 24] = "ZEBRA";
|
|
27
|
+
CocoLabel[CocoLabel["GIRAFFE"] = 25] = "GIRAFFE";
|
|
28
|
+
CocoLabel[CocoLabel["HAT"] = 26] = "HAT";
|
|
29
|
+
CocoLabel[CocoLabel["BACKPACK"] = 27] = "BACKPACK";
|
|
30
|
+
CocoLabel[CocoLabel["UMBRELLA"] = 28] = "UMBRELLA";
|
|
31
|
+
CocoLabel[CocoLabel["SHOE"] = 29] = "SHOE";
|
|
32
|
+
CocoLabel[CocoLabel["EYE"] = 30] = "EYE";
|
|
33
|
+
CocoLabel[CocoLabel["HANDBAG"] = 31] = "HANDBAG";
|
|
34
|
+
CocoLabel[CocoLabel["TIE"] = 32] = "TIE";
|
|
35
|
+
CocoLabel[CocoLabel["SUITCASE"] = 33] = "SUITCASE";
|
|
36
|
+
CocoLabel[CocoLabel["FRISBEE"] = 34] = "FRISBEE";
|
|
37
|
+
CocoLabel[CocoLabel["SKIS"] = 35] = "SKIS";
|
|
38
|
+
CocoLabel[CocoLabel["SNOWBOARD"] = 36] = "SNOWBOARD";
|
|
39
|
+
CocoLabel[CocoLabel["SPORTS"] = 37] = "SPORTS";
|
|
40
|
+
CocoLabel[CocoLabel["KITE"] = 38] = "KITE";
|
|
41
|
+
CocoLabel[CocoLabel["BASEBALL"] = 39] = "BASEBALL";
|
|
42
|
+
CocoLabel[CocoLabel["SKATEBOARD"] = 41] = "SKATEBOARD";
|
|
43
|
+
CocoLabel[CocoLabel["SURFBOARD"] = 42] = "SURFBOARD";
|
|
44
|
+
CocoLabel[CocoLabel["TENNIS_RACKET"] = 43] = "TENNIS_RACKET";
|
|
45
|
+
CocoLabel[CocoLabel["BOTTLE"] = 44] = "BOTTLE";
|
|
46
|
+
CocoLabel[CocoLabel["PLATE"] = 45] = "PLATE";
|
|
47
|
+
CocoLabel[CocoLabel["WINE_GLASS"] = 46] = "WINE_GLASS";
|
|
48
|
+
CocoLabel[CocoLabel["CUP"] = 47] = "CUP";
|
|
49
|
+
CocoLabel[CocoLabel["FORK"] = 48] = "FORK";
|
|
50
|
+
CocoLabel[CocoLabel["KNIFE"] = 49] = "KNIFE";
|
|
51
|
+
CocoLabel[CocoLabel["SPOON"] = 50] = "SPOON";
|
|
52
|
+
CocoLabel[CocoLabel["BOWL"] = 51] = "BOWL";
|
|
53
|
+
CocoLabel[CocoLabel["BANANA"] = 52] = "BANANA";
|
|
54
|
+
CocoLabel[CocoLabel["APPLE"] = 53] = "APPLE";
|
|
55
|
+
CocoLabel[CocoLabel["SANDWICH"] = 54] = "SANDWICH";
|
|
56
|
+
CocoLabel[CocoLabel["ORANGE"] = 55] = "ORANGE";
|
|
57
|
+
CocoLabel[CocoLabel["BROCCOLI"] = 56] = "BROCCOLI";
|
|
58
|
+
CocoLabel[CocoLabel["CARROT"] = 57] = "CARROT";
|
|
59
|
+
CocoLabel[CocoLabel["HOT_DOG"] = 58] = "HOT_DOG";
|
|
60
|
+
CocoLabel[CocoLabel["PIZZA"] = 59] = "PIZZA";
|
|
61
|
+
CocoLabel[CocoLabel["DONUT"] = 60] = "DONUT";
|
|
62
|
+
CocoLabel[CocoLabel["CAKE"] = 61] = "CAKE";
|
|
63
|
+
CocoLabel[CocoLabel["CHAIR"] = 62] = "CHAIR";
|
|
64
|
+
CocoLabel[CocoLabel["COUCH"] = 63] = "COUCH";
|
|
65
|
+
CocoLabel[CocoLabel["POTTED_PLANT"] = 64] = "POTTED_PLANT";
|
|
66
|
+
CocoLabel[CocoLabel["BED"] = 65] = "BED";
|
|
67
|
+
CocoLabel[CocoLabel["MIRROR"] = 66] = "MIRROR";
|
|
68
|
+
CocoLabel[CocoLabel["DINING_TABLE"] = 67] = "DINING_TABLE";
|
|
69
|
+
CocoLabel[CocoLabel["WINDOW"] = 68] = "WINDOW";
|
|
70
|
+
CocoLabel[CocoLabel["DESK"] = 69] = "DESK";
|
|
71
|
+
CocoLabel[CocoLabel["TOILET"] = 70] = "TOILET";
|
|
72
|
+
CocoLabel[CocoLabel["DOOR"] = 71] = "DOOR";
|
|
73
|
+
CocoLabel[CocoLabel["TV"] = 72] = "TV";
|
|
74
|
+
CocoLabel[CocoLabel["LAPTOP"] = 73] = "LAPTOP";
|
|
75
|
+
CocoLabel[CocoLabel["MOUSE"] = 74] = "MOUSE";
|
|
76
|
+
CocoLabel[CocoLabel["REMOTE"] = 75] = "REMOTE";
|
|
77
|
+
CocoLabel[CocoLabel["KEYBOARD"] = 76] = "KEYBOARD";
|
|
78
|
+
CocoLabel[CocoLabel["CELL_PHONE"] = 77] = "CELL_PHONE";
|
|
79
|
+
CocoLabel[CocoLabel["MICROWAVE"] = 78] = "MICROWAVE";
|
|
80
|
+
CocoLabel[CocoLabel["OVEN"] = 79] = "OVEN";
|
|
81
|
+
CocoLabel[CocoLabel["TOASTER"] = 80] = "TOASTER";
|
|
82
|
+
CocoLabel[CocoLabel["SINK"] = 81] = "SINK";
|
|
83
|
+
CocoLabel[CocoLabel["REFRIGERATOR"] = 82] = "REFRIGERATOR";
|
|
84
|
+
CocoLabel[CocoLabel["BLENDER"] = 83] = "BLENDER";
|
|
85
|
+
CocoLabel[CocoLabel["BOOK"] = 84] = "BOOK";
|
|
86
|
+
CocoLabel[CocoLabel["CLOCK"] = 85] = "CLOCK";
|
|
87
|
+
CocoLabel[CocoLabel["VASE"] = 86] = "VASE";
|
|
88
|
+
CocoLabel[CocoLabel["SCISSORS"] = 87] = "SCISSORS";
|
|
89
|
+
CocoLabel[CocoLabel["TEDDY_BEAR"] = 88] = "TEDDY_BEAR";
|
|
90
|
+
CocoLabel[CocoLabel["HAIR_DRIER"] = 89] = "HAIR_DRIER";
|
|
91
|
+
CocoLabel[CocoLabel["TOOTHBRUSH"] = 90] = "TOOTHBRUSH";
|
|
92
|
+
CocoLabel[CocoLabel["HAIR_BRUSH"] = 91] = "HAIR_BRUSH";
|
|
93
|
+
})(CocoLabel || (CocoLabel = {}));
|
|
94
|
+
export {};
|
package/lib/types/ocr.js
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
export {};
|
|
@@ -0,0 +1,94 @@
|
|
|
1
|
+
export interface ModelConfig {
|
|
2
|
+
sources: {
|
|
3
|
+
encoder: string;
|
|
4
|
+
decoder: string;
|
|
5
|
+
};
|
|
6
|
+
tokenizer: {
|
|
7
|
+
source: string;
|
|
8
|
+
bos: number;
|
|
9
|
+
eos: number;
|
|
10
|
+
};
|
|
11
|
+
isMultilingual: boolean;
|
|
12
|
+
}
|
|
13
|
+
export declare enum SpeechToTextLanguage {
|
|
14
|
+
Afrikaans = "af",
|
|
15
|
+
Albanian = "sq",
|
|
16
|
+
Arabic = "ar",
|
|
17
|
+
Armenian = "hy",
|
|
18
|
+
Azerbaijani = "az",
|
|
19
|
+
Basque = "eu",
|
|
20
|
+
Belarusian = "be",
|
|
21
|
+
Bengali = "bn",
|
|
22
|
+
Bosnian = "bs",
|
|
23
|
+
Bulgarian = "bg",
|
|
24
|
+
Burmese = "my",
|
|
25
|
+
Catalan = "ca",
|
|
26
|
+
Chinese = "zh",
|
|
27
|
+
Croatian = "hr",
|
|
28
|
+
Czech = "cs",
|
|
29
|
+
Danish = "da",
|
|
30
|
+
Dutch = "nl",
|
|
31
|
+
Estonian = "et",
|
|
32
|
+
English = "en",
|
|
33
|
+
Finnish = "fi",
|
|
34
|
+
French = "fr",
|
|
35
|
+
Galician = "gl",
|
|
36
|
+
Georgian = "ka",
|
|
37
|
+
German = "de",
|
|
38
|
+
Greek = "el",
|
|
39
|
+
Gujarati = "gu",
|
|
40
|
+
HaitianCreole = "ht",
|
|
41
|
+
Hebrew = "he",
|
|
42
|
+
Hindi = "hi",
|
|
43
|
+
Hungarian = "hu",
|
|
44
|
+
Icelandic = "is",
|
|
45
|
+
Indonesian = "id",
|
|
46
|
+
Italian = "it",
|
|
47
|
+
Japanese = "ja",
|
|
48
|
+
Kannada = "kn",
|
|
49
|
+
Kazakh = "kk",
|
|
50
|
+
Khmer = "km",
|
|
51
|
+
Korean = "ko",
|
|
52
|
+
Lao = "lo",
|
|
53
|
+
Latvian = "lv",
|
|
54
|
+
Lithuanian = "lt",
|
|
55
|
+
Macedonian = "mk",
|
|
56
|
+
Malagasy = "mg",
|
|
57
|
+
Malay = "ms",
|
|
58
|
+
Malayalam = "ml",
|
|
59
|
+
Maltese = "mt",
|
|
60
|
+
Marathi = "mr",
|
|
61
|
+
Nepali = "ne",
|
|
62
|
+
Norwegian = "no",
|
|
63
|
+
Persian = "fa",
|
|
64
|
+
Polish = "pl",
|
|
65
|
+
Portuguese = "pt",
|
|
66
|
+
Punjabi = "pa",
|
|
67
|
+
Romanian = "ro",
|
|
68
|
+
Russian = "ru",
|
|
69
|
+
Serbian = "sr",
|
|
70
|
+
Sinhala = "si",
|
|
71
|
+
Slovak = "sk",
|
|
72
|
+
Slovenian = "sl",
|
|
73
|
+
Spanish = "es",
|
|
74
|
+
Sundanese = "su",
|
|
75
|
+
Swahili = "sw",
|
|
76
|
+
Swedish = "sv",
|
|
77
|
+
Tagalog = "tl",
|
|
78
|
+
Tajik = "tg",
|
|
79
|
+
Tamil = "ta",
|
|
80
|
+
Telugu = "te",
|
|
81
|
+
Thai = "th",
|
|
82
|
+
Turkish = "tr",
|
|
83
|
+
Ukrainian = "uk",
|
|
84
|
+
Urdu = "ur",
|
|
85
|
+
Uzbek = "uz",
|
|
86
|
+
Vietnamese = "vi",
|
|
87
|
+
Welsh = "cy",
|
|
88
|
+
Yiddish = "yi"
|
|
89
|
+
}
|
|
90
|
+
export declare enum AvailableModels {
|
|
91
|
+
WHISPER = "whisper",
|
|
92
|
+
MOONSHINE = "moonshine",
|
|
93
|
+
WHISPER_MULTILINGUAL = "whisperMultilingual"
|
|
94
|
+
}
|
package/lib/types/stt.js
ADDED
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
// Those languages are supported just by whisper multilingual
|
|
2
|
+
export var SpeechToTextLanguage;
|
|
3
|
+
(function (SpeechToTextLanguage) {
|
|
4
|
+
SpeechToTextLanguage["Afrikaans"] = "af";
|
|
5
|
+
SpeechToTextLanguage["Albanian"] = "sq";
|
|
6
|
+
SpeechToTextLanguage["Arabic"] = "ar";
|
|
7
|
+
SpeechToTextLanguage["Armenian"] = "hy";
|
|
8
|
+
SpeechToTextLanguage["Azerbaijani"] = "az";
|
|
9
|
+
SpeechToTextLanguage["Basque"] = "eu";
|
|
10
|
+
SpeechToTextLanguage["Belarusian"] = "be";
|
|
11
|
+
SpeechToTextLanguage["Bengali"] = "bn";
|
|
12
|
+
SpeechToTextLanguage["Bosnian"] = "bs";
|
|
13
|
+
SpeechToTextLanguage["Bulgarian"] = "bg";
|
|
14
|
+
SpeechToTextLanguage["Burmese"] = "my";
|
|
15
|
+
SpeechToTextLanguage["Catalan"] = "ca";
|
|
16
|
+
SpeechToTextLanguage["Chinese"] = "zh";
|
|
17
|
+
SpeechToTextLanguage["Croatian"] = "hr";
|
|
18
|
+
SpeechToTextLanguage["Czech"] = "cs";
|
|
19
|
+
SpeechToTextLanguage["Danish"] = "da";
|
|
20
|
+
SpeechToTextLanguage["Dutch"] = "nl";
|
|
21
|
+
SpeechToTextLanguage["Estonian"] = "et";
|
|
22
|
+
SpeechToTextLanguage["English"] = "en";
|
|
23
|
+
SpeechToTextLanguage["Finnish"] = "fi";
|
|
24
|
+
SpeechToTextLanguage["French"] = "fr";
|
|
25
|
+
SpeechToTextLanguage["Galician"] = "gl";
|
|
26
|
+
SpeechToTextLanguage["Georgian"] = "ka";
|
|
27
|
+
SpeechToTextLanguage["German"] = "de";
|
|
28
|
+
SpeechToTextLanguage["Greek"] = "el";
|
|
29
|
+
SpeechToTextLanguage["Gujarati"] = "gu";
|
|
30
|
+
SpeechToTextLanguage["HaitianCreole"] = "ht";
|
|
31
|
+
SpeechToTextLanguage["Hebrew"] = "he";
|
|
32
|
+
SpeechToTextLanguage["Hindi"] = "hi";
|
|
33
|
+
SpeechToTextLanguage["Hungarian"] = "hu";
|
|
34
|
+
SpeechToTextLanguage["Icelandic"] = "is";
|
|
35
|
+
SpeechToTextLanguage["Indonesian"] = "id";
|
|
36
|
+
SpeechToTextLanguage["Italian"] = "it";
|
|
37
|
+
SpeechToTextLanguage["Japanese"] = "ja";
|
|
38
|
+
SpeechToTextLanguage["Kannada"] = "kn";
|
|
39
|
+
SpeechToTextLanguage["Kazakh"] = "kk";
|
|
40
|
+
SpeechToTextLanguage["Khmer"] = "km";
|
|
41
|
+
SpeechToTextLanguage["Korean"] = "ko";
|
|
42
|
+
SpeechToTextLanguage["Lao"] = "lo";
|
|
43
|
+
SpeechToTextLanguage["Latvian"] = "lv";
|
|
44
|
+
SpeechToTextLanguage["Lithuanian"] = "lt";
|
|
45
|
+
SpeechToTextLanguage["Macedonian"] = "mk";
|
|
46
|
+
SpeechToTextLanguage["Malagasy"] = "mg";
|
|
47
|
+
SpeechToTextLanguage["Malay"] = "ms";
|
|
48
|
+
SpeechToTextLanguage["Malayalam"] = "ml";
|
|
49
|
+
SpeechToTextLanguage["Maltese"] = "mt";
|
|
50
|
+
SpeechToTextLanguage["Marathi"] = "mr";
|
|
51
|
+
SpeechToTextLanguage["Nepali"] = "ne";
|
|
52
|
+
SpeechToTextLanguage["Norwegian"] = "no";
|
|
53
|
+
SpeechToTextLanguage["Persian"] = "fa";
|
|
54
|
+
SpeechToTextLanguage["Polish"] = "pl";
|
|
55
|
+
SpeechToTextLanguage["Portuguese"] = "pt";
|
|
56
|
+
SpeechToTextLanguage["Punjabi"] = "pa";
|
|
57
|
+
SpeechToTextLanguage["Romanian"] = "ro";
|
|
58
|
+
SpeechToTextLanguage["Russian"] = "ru";
|
|
59
|
+
SpeechToTextLanguage["Serbian"] = "sr";
|
|
60
|
+
SpeechToTextLanguage["Sinhala"] = "si";
|
|
61
|
+
SpeechToTextLanguage["Slovak"] = "sk";
|
|
62
|
+
SpeechToTextLanguage["Slovenian"] = "sl";
|
|
63
|
+
SpeechToTextLanguage["Spanish"] = "es";
|
|
64
|
+
SpeechToTextLanguage["Sundanese"] = "su";
|
|
65
|
+
SpeechToTextLanguage["Swahili"] = "sw";
|
|
66
|
+
SpeechToTextLanguage["Swedish"] = "sv";
|
|
67
|
+
SpeechToTextLanguage["Tagalog"] = "tl";
|
|
68
|
+
SpeechToTextLanguage["Tajik"] = "tg";
|
|
69
|
+
SpeechToTextLanguage["Tamil"] = "ta";
|
|
70
|
+
SpeechToTextLanguage["Telugu"] = "te";
|
|
71
|
+
SpeechToTextLanguage["Thai"] = "th";
|
|
72
|
+
SpeechToTextLanguage["Turkish"] = "tr";
|
|
73
|
+
SpeechToTextLanguage["Ukrainian"] = "uk";
|
|
74
|
+
SpeechToTextLanguage["Urdu"] = "ur";
|
|
75
|
+
SpeechToTextLanguage["Uzbek"] = "uz";
|
|
76
|
+
SpeechToTextLanguage["Vietnamese"] = "vi";
|
|
77
|
+
SpeechToTextLanguage["Welsh"] = "cy";
|
|
78
|
+
SpeechToTextLanguage["Yiddish"] = "yi";
|
|
79
|
+
})(SpeechToTextLanguage || (SpeechToTextLanguage = {}));
|
|
80
|
+
export var AvailableModels;
|
|
81
|
+
(function (AvailableModels) {
|
|
82
|
+
AvailableModels["WHISPER"] = "whisper";
|
|
83
|
+
AvailableModels["MOONSHINE"] = "moonshine";
|
|
84
|
+
AvailableModels["WHISPER_MULTILINGUAL"] = "whisperMultilingual";
|
|
85
|
+
})(AvailableModels || (AvailableModels = {}));
|
|
@@ -1,4 +1,3 @@
|
|
|
1
|
-
import { AvailableModels } from '../types/stt';
|
|
2
1
|
export declare const LLAMA3_2_3B: {
|
|
3
2
|
modelSource: string;
|
|
4
3
|
tokenizerSource: string;
|
|
@@ -177,22 +176,40 @@ export declare const STYLE_TRANSFER_RAIN_PRINCESS: {
|
|
|
177
176
|
export declare const STYLE_TRANSFER_UDNIE: {
|
|
178
177
|
modelSource: string;
|
|
179
178
|
};
|
|
180
|
-
export declare const
|
|
181
|
-
|
|
179
|
+
export declare const WHISPER_TINY_EN: {
|
|
180
|
+
isMultilingual: boolean;
|
|
181
|
+
encoderSource: string;
|
|
182
182
|
decoderSource: string;
|
|
183
|
+
tokenizerSource: string;
|
|
184
|
+
};
|
|
185
|
+
export declare const WHISPER_BASE_EN: {
|
|
186
|
+
isMultilingual: boolean;
|
|
183
187
|
encoderSource: string;
|
|
188
|
+
decoderSource: string;
|
|
184
189
|
tokenizerSource: string;
|
|
185
190
|
};
|
|
186
|
-
export declare const
|
|
187
|
-
|
|
191
|
+
export declare const WHISPER_SMALL_EN: {
|
|
192
|
+
isMultilingual: boolean;
|
|
193
|
+
encoderSource: string;
|
|
188
194
|
decoderSource: string;
|
|
195
|
+
tokenizerSource: string;
|
|
196
|
+
};
|
|
197
|
+
export declare const WHISPER_TINY: {
|
|
198
|
+
isMultilingual: boolean;
|
|
189
199
|
encoderSource: string;
|
|
200
|
+
decoderSource: string;
|
|
190
201
|
tokenizerSource: string;
|
|
191
202
|
};
|
|
192
|
-
export declare const
|
|
193
|
-
|
|
203
|
+
export declare const WHISPER_BASE: {
|
|
204
|
+
isMultilingual: boolean;
|
|
205
|
+
encoderSource: string;
|
|
194
206
|
decoderSource: string;
|
|
207
|
+
tokenizerSource: string;
|
|
208
|
+
};
|
|
209
|
+
export declare const WHISPER_SMALL: {
|
|
210
|
+
isMultilingual: boolean;
|
|
195
211
|
encoderSource: string;
|
|
212
|
+
decoderSource: string;
|
|
196
213
|
tokenizerSource: string;
|
|
197
214
|
};
|
|
198
215
|
export declare const DEEPLAB_V3_RESNET50: {
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"modelUrls.d.ts","sourceRoot":"","sources":["../../../src/constants/modelUrls.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"modelUrls.d.ts","sourceRoot":"","sources":["../../../src/constants/modelUrls.ts"],"names":[],"mappings":"AAkBA,eAAO,MAAM,WAAW;;;;CAIvB,CAAC;AAEF,eAAO,MAAM,iBAAiB;;;;CAI7B,CAAC;AAEF,eAAO,MAAM,qBAAqB;;;;CAIjC,CAAC;AAEF,eAAO,MAAM,WAAW;;;;CAIvB,CAAC;AAEF,eAAO,MAAM,iBAAiB;;;;CAI7B,CAAC;AAEF,eAAO,MAAM,qBAAqB;;;;CAIjC,CAAC;AAYF,eAAO,MAAM,UAAU;;;;CAItB,CAAC;AAEF,eAAO,MAAM,oBAAoB;;;;CAIhC,CAAC;AAEF,eAAO,MAAM,UAAU;;;;CAItB,CAAC;AAEF,eAAO,MAAM,oBAAoB;;;;CAIhC,CAAC;AAEF,eAAO,MAAM,QAAQ;;;;CAIpB,CAAC;AAEF,eAAO,MAAM,kBAAkB;;;;CAI9B,CAAC;AAYF,eAAO,MAAM,cAAc;;;;CAI1B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;CAIpC,CAAC;AAEF,eAAO,MAAM,cAAc;;;;CAI1B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;CAIpC,CAAC;AAEF,eAAO,MAAM,YAAY;;;;CAIxB,CAAC;AAEF,eAAO,MAAM,sBAAsB;;;;CAIlC,CAAC;AAYF,eAAO,MAAM,cAAc;;;;CAI1B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;CAIpC,CAAC;AAEF,eAAO,MAAM,cAAc;;;;CAI1B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;CAIpC,CAAC;AAEF,eAAO,MAAM,cAAc;;;;CAI1B,CAAC;AAEF,eAAO,MAAM,wBAAwB;;;;CAIpC,CAAC;AAYF,eAAO,MAAM,YAAY;;;;CAIxB,CAAC;AAEF,eAAO,MAAM,sBAAsB;;;;CAIlC,CAAC;AAEF,eAAO,MAAM,YAAY;;;;CAIxB,CAAC;AAEF,eAAO,MAAM,sBAAsB;;;;CAIlC,CAAC;AAEF,eAAO,MAAM,UAAU;;;;CAItB,CAAC;AAEF,eAAO,MAAM,oBAAoB;;;;CAIhC,CAAC;AAQF,eAAO,MAAM,aAAa;;;;CAIzB,CAAC;AAEF,eAAO,MAAM,uBAAuB;;;;CAInC,CAAC;AAQF,eAAO,MAAM,iBAAiB;;CAE7B,CAAC;AAKF,eAAO,MAAM,8BAA8B;;CAE1C,CAAC;AAoBF,eAAO,MAAM,oBAAoB;;CAEhC,CAAC;AAEF,eAAO,MAAM,qBAAqB;;CAEjC,CAAC;AAEF,eAAO,MAAM,4BAA4B;;CAExC,CAAC;AAEF,eAAO,MAAM,oBAAoB;;CAEhC,CAAC;AA2BF,eAAO,MAAM,eAAe;;;;;CAK3B,CAAC;AAEF,eAAO,MAAM,eAAe;;;;;CAK3B,CAAC;AAEF,eAAO,MAAM,gBAAgB;;;;;CAK5B,CAAC;AAEF,eAAO,MAAM,YAAY;;;;;CAKxB,CAAC;AAEF,eAAO,MAAM,YAAY;;;;;CAKxB,CAAC;AAEF,eAAO,MAAM,aAAa;;;;;CAKzB,CAAC;AAKF,eAAO,MAAM,mBAAmB;;CAE/B,CAAC;AAKF,eAAO,MAAM,2BAA2B;;CAEvC,CAAC;AAcF,eAAO,MAAM,gBAAgB;;;CAG5B,CAAC;AAEF,eAAO,MAAM,iBAAiB;;;CAG7B,CAAC;AAEF,eAAO,MAAM,yBAAyB;;;CAGrC,CAAC;AAEF,eAAO,MAAM,0BAA0B;;;CAGtC,CAAC;AAEF,eAAO,MAAM,0BAA0B;;;CAGtC,CAAC"}
|