npm - react-native-sherpa-onnx - Versions diffs - 0.3.2 → 0.3.4 - Mend

react-native-sherpa-onnx 0.3.2 → 0.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83)

package/README.md +84 -77
package/SherpaOnnx.podspec +79 -45
package/android/build.gradle +8 -2
package/android/prebuilt-download.gradle +70 -16
package/android/prebuilt-versions.gradle +14 -6
package/android/src/main/cpp/CMakeLists.txt +2 -0
package/android/src/main/cpp/jni/audio/sherpa-onnx-audio-convert-jni.cpp +202 -328
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-detect-jni-common.cpp +22 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-detect-jni-common.h +2 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-helper.cpp +96 -142
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-helper.h +40 -4
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-stt.cpp +774 -316
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-tts.cpp +208 -122
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect.h +92 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-stt-wrapper.cpp +3 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-tts-wrapper.cpp +14 -2
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-stt.cpp +229 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-stt.h +38 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-tts.cpp +144 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-tts.h +38 -0
package/android/src/main/cpp/jni/module/sherpa-onnx-module-jni.cpp +1 -1
package/android/src/main/java/com/sherpaonnx/SherpaOnnxModule.kt +157 -11
package/android/src/main/java/com/sherpaonnx/SherpaOnnxPcmCapture.kt +150 -0
package/android/src/main/java/com/sherpaonnx/SherpaOnnxSttHelper.kt +75 -24
package/android/src/main/java/com/sherpaonnx/SherpaOnnxTtsHelper.kt +52 -1
package/ios/SherpaOnnx+PcmLiveStream.mm +288 -0
package/ios/SherpaOnnx+STT.mm +2 -0
package/ios/SherpaOnnx+TTS.mm +17 -0
package/ios/SherpaOnnx.mm +27 -3
package/ios/SherpaOnnxAudioConvert.h +28 -0
package/ios/SherpaOnnxAudioConvert.mm +698 -0
package/ios/archive/sherpa-onnx-archive-helper.mm +12 -0
package/ios/model_detect/sherpa-onnx-model-detect-helper.h +37 -3
package/ios/model_detect/sherpa-onnx-model-detect-helper.mm +80 -45
package/ios/model_detect/sherpa-onnx-model-detect-stt.mm +629 -267
package/ios/model_detect/sherpa-onnx-model-detect-tts.mm +148 -56
package/ios/model_detect/sherpa-onnx-model-detect.h +72 -0
package/ios/model_detect/sherpa-onnx-validate-stt.h +38 -0
package/ios/model_detect/sherpa-onnx-validate-stt.mm +229 -0
package/ios/model_detect/sherpa-onnx-validate-tts.h +38 -0
package/ios/model_detect/sherpa-onnx-validate-tts.mm +144 -0
package/ios/stt/sherpa-onnx-stt-wrapper.mm +4 -0
package/lib/module/NativeSherpaOnnx.js.map +1 -1
package/lib/module/audio/index.js +55 -1
package/lib/module/audio/index.js.map +1 -1
package/lib/module/download/ModelDownloadManager.js +14 -0
package/lib/module/download/ModelDownloadManager.js.map +1 -1
package/lib/module/index.js +10 -0
package/lib/module/index.js.map +1 -1
package/lib/module/stt/streaming.js +6 -3
package/lib/module/stt/streaming.js.map +1 -1
package/lib/module/tts/index.js +13 -1
package/lib/module/tts/index.js.map +1 -1
package/lib/typescript/src/NativeSherpaOnnx.d.ts +32 -3
package/lib/typescript/src/NativeSherpaOnnx.d.ts.map +1 -1
package/lib/typescript/src/audio/index.d.ts +20 -1
package/lib/typescript/src/audio/index.d.ts.map +1 -1
package/lib/typescript/src/download/ModelDownloadManager.d.ts +2 -1
package/lib/typescript/src/download/ModelDownloadManager.d.ts.map +1 -1
package/lib/typescript/src/index.d.ts +10 -0
package/lib/typescript/src/index.d.ts.map +1 -1
package/lib/typescript/src/stt/streaming.d.ts.map +1 -1
package/lib/typescript/src/stt/streamingTypes.d.ts +1 -1
package/lib/typescript/src/stt/streamingTypes.d.ts.map +1 -1
package/lib/typescript/src/tts/index.d.ts +12 -1
package/lib/typescript/src/tts/index.d.ts.map +1 -1
package/package.json +6 -1
package/scripts/check-model-csvs.sh +72 -0
package/scripts/setup-ios-framework.sh +272 -191
package/src/NativeSherpaOnnx.ts +37 -3
package/src/audio/index.ts +84 -1
package/src/download/ModelDownloadManager.ts +19 -0
package/src/index.tsx +15 -0
package/src/stt/streaming.ts +10 -5
package/src/stt/streamingTypes.ts +1 -1
package/src/tts/index.ts +25 -1
package/third_party/ffmpeg_prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/libarchive_prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/libarchive_prebuilt/IOS_RELEASE_TAG +1 -1
package/third_party/sherpa-onnx-prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/sherpa-onnx-prebuilt/IOS_RELEASE_TAG +1 -1
package/ios/scripts/patch-libarchive-includes.sh +0 -61
package/ios/scripts/setup-ios-libarchive.sh +0 -98

package/ios/archive/sherpa-onnx-archive-helper.mm CHANGED

@@ -6,8 +6,10 @@
  */
 #import "sherpa-onnx-archive-helper.h"
+#ifdef HAVE_LIBARCHIVE
 #import <archive.h>
 #import <archive_entry.h>
+#endif
 #import <CommonCrypto/CommonCrypto.h>
 #include <array>
 #include <atomic>
@@ -17,6 +19,7 @@
 static std::atomic_bool g_cancelExtract(false);
 namespace {
+#ifdef HAVE_LIBARCHIVE
 struct ArchiveReadContext {
   FILE* file = nullptr;
   std::array<unsigned char, 64 * 1024> buffer{};
@@ -66,6 +69,7 @@ static void DrainRemainingAndClose(ArchiveReadContext* ctx) {
   fclose(ctx->file);
   ctx->file = nullptr;
 }
+#endif
 static NSString* HexStringFromDigest(const unsigned char* digest, size_t size) {
   static const char* kHex = "0123456789abcdef";
@@ -122,7 +126,11 @@ static NSString* ComputeFileSha256(NSString* filePath, NSError** error) {
 + (void)cancelExtractTarBz2
 {
+#ifdef HAVE_LIBARCHIVE
   g_cancelExtract.store(true);
+#else
+  // feature disabled
+#endif
 }
 - (NSDictionary *)extractTarBz2:(NSString *)sourcePath
@@ -130,6 +138,9 @@ static NSString* ComputeFileSha256(NSString* filePath, NSError** error) {
            force:(BOOL)force
            progress:(SherpaOnnxArchiveProgressBlock)progress
 {
+#ifndef HAVE_LIBARCHIVE
+  return @{ @"success": @NO, @"reason": @"libarchive is disabled in this build. Rebuild without SHERPA_ONNX_DISABLE_LIBARCHIVE=1." };
+#else
   g_cancelExtract.store(false);
   NSFileManager *fileManager = [NSFileManager defaultManager];
@@ -285,6 +296,7 @@ static NSString* ComputeFileSha256(NSString* filePath, NSError** error) {
   NSString *sha256Hex = HexStringFromDigest(digest, CC_SHA256_DIGEST_LENGTH);
   return @{ @"success": @YES, @"path": targetPath, @"sha256": sha256Hex ?: @"" };
+#endif
 }
 - (NSString *)computeFileSha256:(NSString *)filePath

package/ios/model_detect/sherpa-onnx-model-detect-helper.h CHANGED

@@ -21,12 +21,11 @@ std::vector<std::string> ListDirectories(const std::string& path);
 std::vector<FileEntry> ListFiles(const std::string& path);
 std::vector<FileEntry> ListFilesRecursive(const std::string& path, int maxDepth);
 std::string ToLower(std::string value);
-std::string ResolveTokenizerDir(const std::string& modelDir);
-std::string FindFileByName(const std::string& baseDir, const std::string& fileName, int maxDepth);
+/** Find file in \p files whose name equals \p fileName (case-insensitive). Uses file tree only, no filesystem. */
+std::string FindFileByName(const std::vector<FileEntry>& files, const std::string& fileName);
 /** Find file whose name equals or ends with suffix (e.g. tokens.txt, tiny-tokens.txt) in a pre-built file list. */
 std::string FindFileEndingWith(const std::vector<FileEntry>& files, const std::string& suffix);
-std::string FindDirectoryByName(const std::string& baseDir, const std::string& dirName, int maxDepth);
 std::string FindOnnxByToken(
     const std::vector<FileEntry>& files,
@@ -38,6 +37,13 @@ std::string FindOnnxByAnyToken(
     const std::vector<std::string>& tokens,
     const std::optional<bool>& preferInt8
 );
+/** Like FindOnnxByAnyToken but skips any file whose nameLower contains any of \p excludeInName. */
+std::string FindOnnxByAnyTokenExcluding(
+    const std::vector<FileEntry>& files,
+    const std::vector<std::string>& tokens,
+    const std::vector<std::string>& excludeInName,
+    const std::optional<bool>& preferInt8
+);
 std::string FindLargestOnnxExcludingTokens(
     const std::vector<FileEntry>& files,
     const std::vector<std::string>& excludeTokens
@@ -46,6 +52,34 @@ std::string FindLargestOnnxExcludingTokens(
 /** Returns true if \p word appears in \p haystack as a standalone token (surrounded by separators: / - _ . space). */
 bool ContainsWord(const std::string& haystack, const std::string& word);
+/**
+ * Find a directory with the given name anywhere under \p rootDir in the file tree.
+ * Searches \p files for any path that starts with \p rootDir and contains "/dirName/".
+ * Returns the full path to that directory (e.g. rootDir/inner/dirName) or empty if not found.
+ * Used e.g. to find espeak-ng-data in modelDir or in modelDir/inner-model-dir/.
+ */
+std::string FindDirectoryUnderRoot(
+    const std::vector<FileEntry>& files,
+    const std::string& rootDir,
+    const std::string& dirName
+);
+/** Lexicon file with optional language id for multi-lang TTS (e.g. Kokoro). */
+struct LexiconCandidate {
+    std::string path;       /**< Full path to the lexicon file */
+    std::string languageId; /**< From filename: "default" for lexicon.txt, else e.g. "us-en", "zh" from lexicon-us-en.txt, lexicon-zh.txt */
+};
+/**
+ * Find all lexicon files under \p rootDir: exact "lexicon.txt" and any "lexicon-*.txt".
+ * Returns a list of LexiconCandidate (path + languageId), ordered: lexicon.txt first (as "default"),
+ * then lexicon-*.txt alphabetically by language id. Used for multi-language Kokoro/Kitten TTS.
+ */
+std::vector<LexiconCandidate> FindLexiconCandidates(
+    const std::vector<FileEntry>& files,
+    const std::string& rootDir
+);
 } // namespace model_detect
 } // namespace sherpaonnx

package/ios/model_detect/sherpa-onnx-model-detect-helper.mm CHANGED

@@ -30,12 +30,16 @@ bool ContainsToken(const std::string& value, const std::string& token) {
     return value.find(token) != std::string::npos;
 }
+static bool IsOnnxOrOrtFile(const FileEntry& entry) {
+    return EndsWith(entry.nameLower, ".onnx") || EndsWith(entry.nameLower, ".ort");
+}
 std::string ChooseLargest(const std::vector<FileEntry>& files,
     const std::vector<std::string>& excludeTokens, bool onlyInt8, bool onlyNonInt8) {
     std::string chosen;
     std::uint64_t bestSize = 0;
     for (const auto& entry : files) {
-        if (!EndsWith(entry.nameLower, ".onnx")) continue;
+        if (!IsOnnxOrOrtFile(entry)) continue;
         bool hasExcluded = false;
         for (const auto& token : excludeTokens) {
             if (ContainsToken(entry.nameLower, token)) { hasExcluded = true; break; }
@@ -115,7 +119,7 @@ std::string FindOnnxByToken(const std::vector<FileEntry>& files,
     std::string tokenLower = ToLower(token);
     std::vector<FileEntry> matches;
     for (const auto& entry : files) {
-        if (!EndsWith(entry.nameLower, ".onnx")) continue;
+        if (!IsOnnxOrOrtFile(entry)) continue;
         if (ContainsToken(entry.nameLower, tokenLower)) matches.push_back(entry);
     }
     if (matches.empty()) return "";
@@ -136,6 +140,37 @@ std::string FindOnnxByAnyToken(const std::vector<FileEntry>& files,
     return "";
 }
+std::string FindOnnxByAnyTokenExcluding(const std::vector<FileEntry>& files,
+    const std::vector<std::string>& tokens, const std::vector<std::string>& excludeInName,
+    const std::optional<bool>& preferInt8) {
+    for (const auto& token : tokens) {
+        std::string tokenLower = ToLower(token);
+        std::vector<FileEntry> matches;
+        for (const auto& entry : files) {
+            if (!IsOnnxOrOrtFile(entry)) continue;
+            if (!ContainsToken(entry.nameLower, tokenLower)) continue;
+            bool excluded = false;
+            for (const auto& ex : excludeInName) {
+                std::string exLower = ToLower(ex);
+                if (ContainsToken(entry.nameLower, exLower)) {
+                    excluded = true;
+                    break;
+                }
+            }
+            if (!excluded) matches.push_back(entry);
+        }
+        if (matches.empty()) continue;
+        std::vector<std::string> emptyTokens;
+        bool wantInt8 = preferInt8.has_value() && preferInt8.value();
+        bool wantNonInt8 = preferInt8.has_value() && !preferInt8.value();
+        std::string chosen = ChooseLargest(matches, emptyTokens, wantInt8, wantNonInt8);
+        if (!chosen.empty()) return chosen;
+        chosen = ChooseLargest(matches, emptyTokens, false, false);
+        if (!chosen.empty()) return chosen;
+    }
+    return "";
+}
 std::string FindFileEndingWith(const std::vector<FileEntry>& files, const std::string& suffix) {
     std::string targetSuffix = ToLower(suffix);
     for (const auto& entry : files) {
@@ -147,9 +182,8 @@ std::string FindFileEndingWith(const std::vector<FileEntry>& files, const std::s
     return "";
 }
-std::string FindFileByName(const std::string& baseDir, const std::string& fileName, int maxDepth) {
+std::string FindFileByName(const std::vector<FileEntry>& files, const std::string& fileName) {
     std::string target = ToLower(fileName);
-    auto files = ListFilesRecursive(baseDir, maxDepth);
     for (const auto& entry : files) {
         if (entry.nameLower == target) return entry.path;
     }
@@ -172,54 +206,55 @@ bool ContainsWord(const std::string& haystack, const std::string& word) {
     return false;
 }
-std::string FindDirectoryByName(const std::string& baseDir, const std::string& dirName, int maxDepth) {
-    std::string target = ToLower(dirName);
-    std::vector<std::string> toVisit = ListDirectories(baseDir);
-    int depth = 0;
-    while (!toVisit.empty() && depth <= maxDepth) {
-        std::vector<std::string> next;
-        for (const auto& dir : toVisit) {
-            std::string name = fs::path(dir).filename().string();
-            if (ToLower(name) == target) return dir;
-            if (depth < maxDepth) {
-                auto nested = ListDirectories(dir);
-                next.insert(next.end(), nested.begin(), nested.end());
-            }
+std::string FindDirectoryUnderRoot(
+    const std::vector<FileEntry>& files,
+    const std::string& rootDir,
+    const std::string& dirName
+) {
+    if (dirName.empty()) return "";
+    const std::string needle = "/" + dirName + "/";
+    const size_t dirPathLen = 1 + dirName.size();
+    for (const auto& entry : files) {
+        if (entry.path.size() < rootDir.size() + needle.size()) continue;
+        if (entry.path.compare(0, rootDir.size(), rootDir) != 0) continue;
+        size_t pos = entry.path.find(needle, rootDir.size());
+        if (pos != std::string::npos) {
+            return entry.path.substr(0, pos + dirPathLen);
         }
-        toVisit.swap(next);
-        depth += 1;
     }
     return "";
 }
-std::string ResolveTokenizerDir(const std::string& modelDir) {
-    std::string vocabInMain = modelDir + "/vocab.json";
-    if (FileExists(vocabInMain)) {
-        return modelDir;
-    }
-    try {
-        for (const auto& entry : fs::directory_iterator(modelDir)) {
-            if (entry.is_directory()) {
-                std::string dirName = entry.path().filename().string();
-                std::string dirNameLower = ToLower(dirName);
-                if (dirNameLower.find("qwen3") != std::string::npos) {
-                    std::string vocabPath = entry.path().string() + "/vocab.json";
-                    if (FileExists(vocabPath)) {
-                        return entry.path().string();
-                    }
-                }
-            }
+std::vector<LexiconCandidate> FindLexiconCandidates(
+    const std::vector<FileEntry>& files,
+    const std::string& rootDir
+) {
+    std::vector<LexiconCandidate> candidates;
+    const size_t rootLen = rootDir.size();
+    for (const auto& entry : files) {
+        if (entry.path.size() <= rootLen) continue;
+        if (rootLen > 0) {
+            if (entry.path.compare(0, rootLen, rootDir) != 0) continue;
+            // Enforce path boundary: if rootDir doesn't end with '/', require '/' after it
+            if (rootDir.back() != '/' && entry.path[rootLen] != '/') continue;
+        }
+        const std::string& baseLower = entry.nameLower;
+        if (baseLower == "lexicon.txt") {
+            candidates.push_back({entry.path, "default"});
+        } else if (baseLower.size() > 12 &&
+                   baseLower.compare(0, 8, "lexicon-") == 0 &&
+                   baseLower.compare(baseLower.size() - 4, 4, ".txt") == 0) {
+            std::string languageId = baseLower.substr(8, baseLower.size() - 12);
+            candidates.push_back({entry.path, languageId});
         }
-    } catch (const std::exception&) {
-    }
-    std::string commonPath = modelDir + "/Qwen3-0.6B";
-    if (FileExists(commonPath + "/vocab.json")) {
-        return commonPath;
     }
-    return "";
+    std::sort(candidates.begin(), candidates.end(), [](const LexiconCandidate& a, const LexiconCandidate& b) {
+        if (a.languageId == b.languageId) return a.path < b.path;
+        if (a.languageId == "default") return true;
+        if (b.languageId == "default") return false;
+        return a.languageId < b.languageId;
+    });
+    return candidates;
 }
 } // namespace model_detect