npm - react-native-sherpa-onnx - Versions diffs - 0.3.2 → 0.3.4 - Mend

react-native-sherpa-onnx 0.3.2 → 0.3.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

package/README.md +84 -77
package/SherpaOnnx.podspec +79 -45
package/android/build.gradle +8 -2
package/android/prebuilt-download.gradle +70 -16
package/android/prebuilt-versions.gradle +14 -6
package/android/src/main/cpp/CMakeLists.txt +2 -0
package/android/src/main/cpp/jni/audio/sherpa-onnx-audio-convert-jni.cpp +202 -328
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-detect-jni-common.cpp +22 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-detect-jni-common.h +2 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-helper.cpp +96 -142
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-helper.h +40 -4
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-stt.cpp +774 -316
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect-tts.cpp +208 -122
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-model-detect.h +92 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-stt-wrapper.cpp +3 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-tts-wrapper.cpp +14 -2
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-stt.cpp +229 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-stt.h +38 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-tts.cpp +144 -0
package/android/src/main/cpp/jni/model_detect/sherpa-onnx-validate-tts.h +38 -0
package/android/src/main/cpp/jni/module/sherpa-onnx-module-jni.cpp +1 -1
package/android/src/main/java/com/sherpaonnx/SherpaOnnxModule.kt +157 -11
package/android/src/main/java/com/sherpaonnx/SherpaOnnxPcmCapture.kt +150 -0
package/android/src/main/java/com/sherpaonnx/SherpaOnnxSttHelper.kt +75 -24
package/android/src/main/java/com/sherpaonnx/SherpaOnnxTtsHelper.kt +52 -1
package/ios/SherpaOnnx+PcmLiveStream.mm +288 -0
package/ios/SherpaOnnx+STT.mm +2 -0
package/ios/SherpaOnnx+TTS.mm +17 -0
package/ios/SherpaOnnx.mm +27 -3
package/ios/SherpaOnnxAudioConvert.h +28 -0
package/ios/SherpaOnnxAudioConvert.mm +698 -0
package/ios/archive/sherpa-onnx-archive-helper.mm +12 -0
package/ios/model_detect/sherpa-onnx-model-detect-helper.h +37 -3
package/ios/model_detect/sherpa-onnx-model-detect-helper.mm +80 -45
package/ios/model_detect/sherpa-onnx-model-detect-stt.mm +629 -267
package/ios/model_detect/sherpa-onnx-model-detect-tts.mm +148 -56
package/ios/model_detect/sherpa-onnx-model-detect.h +72 -0
package/ios/model_detect/sherpa-onnx-validate-stt.h +38 -0
package/ios/model_detect/sherpa-onnx-validate-stt.mm +229 -0
package/ios/model_detect/sherpa-onnx-validate-tts.h +38 -0
package/ios/model_detect/sherpa-onnx-validate-tts.mm +144 -0
package/ios/stt/sherpa-onnx-stt-wrapper.mm +4 -0
package/lib/module/NativeSherpaOnnx.js.map +1 -1
package/lib/module/audio/index.js +55 -1
package/lib/module/audio/index.js.map +1 -1
package/lib/module/download/ModelDownloadManager.js +14 -0
package/lib/module/download/ModelDownloadManager.js.map +1 -1
package/lib/module/index.js +10 -0
package/lib/module/index.js.map +1 -1
package/lib/module/stt/streaming.js +6 -3
package/lib/module/stt/streaming.js.map +1 -1
package/lib/module/tts/index.js +13 -1
package/lib/module/tts/index.js.map +1 -1
package/lib/typescript/src/NativeSherpaOnnx.d.ts +32 -3
package/lib/typescript/src/NativeSherpaOnnx.d.ts.map +1 -1
package/lib/typescript/src/audio/index.d.ts +20 -1
package/lib/typescript/src/audio/index.d.ts.map +1 -1
package/lib/typescript/src/download/ModelDownloadManager.d.ts +2 -1
package/lib/typescript/src/download/ModelDownloadManager.d.ts.map +1 -1
package/lib/typescript/src/index.d.ts +10 -0
package/lib/typescript/src/index.d.ts.map +1 -1
package/lib/typescript/src/stt/streaming.d.ts.map +1 -1
package/lib/typescript/src/stt/streamingTypes.d.ts +1 -1
package/lib/typescript/src/stt/streamingTypes.d.ts.map +1 -1
package/lib/typescript/src/tts/index.d.ts +12 -1
package/lib/typescript/src/tts/index.d.ts.map +1 -1
package/package.json +6 -1
package/scripts/check-model-csvs.sh +72 -0
package/scripts/setup-ios-framework.sh +272 -191
package/src/NativeSherpaOnnx.ts +37 -3
package/src/audio/index.ts +84 -1
package/src/download/ModelDownloadManager.ts +19 -0
package/src/index.tsx +15 -0
package/src/stt/streaming.ts +10 -5
package/src/stt/streamingTypes.ts +1 -1
package/src/tts/index.ts +25 -1
package/third_party/ffmpeg_prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/libarchive_prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/libarchive_prebuilt/IOS_RELEASE_TAG +1 -1
package/third_party/sherpa-onnx-prebuilt/ANDROID_RELEASE_TAG +1 -1
package/third_party/sherpa-onnx-prebuilt/IOS_RELEASE_TAG +1 -1
package/ios/scripts/patch-libarchive-includes.sh +0 -61
package/ios/scripts/setup-ios-libarchive.sh +0 -98

package/ios/SherpaOnnx+PcmLiveStream.mm ADDED Viewed

@@ -0,0 +1,288 @@
+/**
+ * SherpaOnnx+PcmLiveStream.mm
+ *
+ * Native PCM live capture from the microphone via Audio Queue API (AudioQueueNewInput).
+ * Captures at a supported hardware rate (16000, 44100, 48000), resamples to the requested
+ * target rate, and emits pcmLiveStreamData at target rate (same behavior as Android).
+ */
+#import "SherpaOnnx.h"
+#import <AVFoundation/AVFoundation.h>
+#import <AudioToolbox/AudioToolbox.h>
+#import <React/RCTLog.h>
+#import <stdlib.h>
+static const UInt32 kPcmLiveAQNumberBuffers = 3;  // Number of AudioQueue buffers allocated and enqueued per capture session.
+/** Capture sample rates to try in order (match Android CAPTURE_RATES). */
+static const int kPcmLiveCaptureRates[] = { 16000, 44100, 48000 };
+static const size_t kPcmLiveCaptureRatesCount = sizeof(kPcmLiveCaptureRates) / sizeof(kPcmLiveCaptureRates[0]);  // Element count of kPcmLiveCaptureRates.
+static NSInteger _pcmLiveTargetSampleRate = 16000;  // Rate (Hz) reported with emitted PCM; written when a stream is started, read by the input callback.
+static NSInteger _pcmLiveCaptureRate = 16000;  // Rate (Hz) the input queue was actually created with; written when a stream is started.
+static __weak SherpaOnnx *_pcmLiveModule = nil;  // Weak reference to the module used to send events; the callback does nothing once it is nil.
+static AudioQueueRef _pcmLiveAudioQueue = NULL;  // Current input queue, or NULL when none exists.
+static AudioQueueBufferRef _pcmLiveAQBuffers[kPcmLiveAQNumberBuffers];  // Buffers allocated on _pcmLiveAudioQueue; entries are reset to NULL when freed.
+static volatile BOOL _pcmLiveAQRunning = NO;  // Gate checked first by the input callback. NOTE(review): volatile is not a synchronization primitive — confirm this is sufficient if the callback runs on another thread.
+/**
+ * Sends one chunk of 16-bit PCM to JS as a "pcmLiveStreamData" event.
+ *
+ * The samples are copied immediately, so the caller may reuse its buffer as soon as
+ * this function returns. Base64 encoding and the event emission run on the main queue.
+ * Does nothing when module is nil or count is 0.
+ *
+ * @param module     Event emitter that receives the event.
+ * @param samples    Pointer to count Int16 samples.
+ * @param count      Number of samples (not bytes).
+ * @param sampleRate Sample rate in Hz reported in the event body.
+ */
+static void emitPcmChunk(SherpaOnnx *module, const int16_t *samples, NSUInteger count, NSInteger sampleRate) {
+  if (module == nil) return;
+  if (count == 0) return;
+  // Snapshot the audio now; the source buffer is handed back to the queue by the caller.
+  const NSUInteger byteLength = count * sizeof(int16_t);
+  NSData *pcmBytes = [NSData dataWithBytes:samples length:byteLength];
+  // Encode and emit on the main queue to avoid bridge thread-safety issues.
+  dispatch_block_t sendEvent = ^{
+    NSString *encoded = [pcmBytes base64EncodedStringWithOptions:0];
+    NSDictionary *payload = @{ @"base64Pcm": encoded, @"sampleRate": @(sampleRate) };
+    [module sendEventWithName:@"pcmLiveStreamData" body:payload];
+  };
+  dispatch_async(dispatch_get_main_queue(), sendEvent);
+}
+/**
+ * Sends a "pcmLiveStreamError" event carrying a human-readable message.
+ *
+ * The emission is dispatched to the main queue, like the data events. A nil message
+ * is reported as an empty string. Does nothing when module is nil.
+ *
+ * @param module  Event emitter that receives the event.
+ * @param message Error description; may be nil.
+ */
+static void emitPcmError(SherpaOnnx *module, NSString *message) {
+  if (module == nil) return;
+  dispatch_block_t sendEvent = ^{
+    NSString *text = message ?: @"";
+    NSDictionary *payload = @{ @"message": text };
+    [module sendEventWithName:@"pcmLiveStreamError" body:payload];
+  };
+  dispatch_async(dispatch_get_main_queue(), sendEvent);
+}
+/**
+ * Resample Int16 PCM from fromRate to toRate using linear interpolation (match Android resampleInt16).
+ *
+ * Each call is independent: no interpolation state is carried over between calls.
+ * When fromRate equals toRate the samples are copied unchanged.
+ *
+ * @param input          Source samples; must point to at least inputFrames values.
+ * @param inputFrames    Number of source samples.
+ * @param fromRate       Source sample rate in Hz; must be positive.
+ * @param toRate         Destination sample rate in Hz; must be positive.
+ * @param output         Destination buffer; must hold at least outputCapacity samples.
+ * @param outputCapacity Maximum number of samples that may be written to output.
+ * @return Number of samples written: floor(inputFrames * toRate / fromRate), limited to
+ *         outputCapacity. Returns 0 for NULL buffers, empty input, zero capacity, or
+ *         non-positive rates.
+ */
+static NSUInteger pcmLiveResampleInt16(const int16_t *input, NSUInteger inputFrames,
+                                      int fromRate, int toRate,
+                                      int16_t *output, size_t outputCapacity) {
+  // Reject arguments that would dereference NULL, or that would produce a zero, negative
+  // or infinite ratio: converting such a double to NSUInteger is undefined behavior.
+  if (input == NULL || output == NULL) return 0;
+  if (inputFrames == 0 || outputCapacity == 0) return 0;
+  if (fromRate <= 0 || toRate <= 0) return 0;
+  if (fromRate == toRate) {
+    size_t copy = (inputFrames < outputCapacity) ? inputFrames : outputCapacity;
+    memcpy(output, input, copy * sizeof(int16_t));
+    return copy;
+  }
+  // ratio = number of input samples consumed per output sample.
+  double ratio = (double)fromRate / (double)toRate;
+  NSUInteger outLength = (NSUInteger)((double)inputFrames / ratio);
+  if (outLength > outputCapacity) outLength = outputCapacity;
+  if (outLength == 0) return 0;
+  for (NSUInteger i = 0; i < outLength; i++) {
+    double srcIdx = (double)i * ratio;
+    // Clamp both neighbours to the last sample so the tail never reads past the input.
+    NSUInteger idx0 = (NSUInteger)srcIdx;
+    if (idx0 >= inputFrames) idx0 = inputFrames - 1;
+    NSUInteger idx1 = idx0 + 1;
+    if (idx1 >= inputFrames) idx1 = inputFrames - 1;
+    float frac = (float)(srcIdx - (double)idx0);
+    int v0 = (int)input[idx0];
+    int v1 = (int)input[idx1];
+    // Truncating conversion (not rounding) is kept deliberately to match the Android output.
+    int v = (int)(v0 + (v1 - v0) * frac);
+    if (v < -32768) v = -32768;
+    if (v > 32767) v = 32767;
+    output[i] = (int16_t)v;
+  }
+  return outLength;
+}
+/**
+ * AudioQueue input callback: forwards each filled buffer to JS as Int16 PCM.
+ *
+ * When the capture rate differs from the target rate, the buffer is first resampled
+ * into a temporary heap buffer. The audio buffer is handed back to the queue on every
+ * path except the two early exits (capture not running, or module already released).
+ *
+ * @param inAQ     Queue that produced the buffer; the buffer is re-enqueued on it.
+ * @param inBuffer Filled buffer; mAudioDataByteSize bytes are read as Int16 samples.
+ * The remaining parameters are unused.
+ */
+static void pcmLiveAQInputCallback(void *inUserData,
+                                   AudioQueueRef inAQ,
+                                   AudioQueueBufferRef inBuffer,
+                                   const AudioTimeStamp *inStartTime,
+                                   UInt32 inNumPackets,
+                                   const AudioStreamPacketDescription *inPacketDesc) {
+  (void)inUserData;
+  (void)inStartTime;
+  (void)inNumPackets;
+  (void)inPacketDesc;
+  // These two exits intentionally do not re-enqueue the buffer.
+  if (!_pcmLiveAQRunning) return;
+  SherpaOnnx *emitter = _pcmLiveModule;
+  if (emitter == nil) return;
+  const UInt32 filledBytes = inBuffer->mAudioDataByteSize;
+  if (filledBytes > 0) {
+    const int16_t *pcm = (const int16_t *)inBuffer->mAudioData;
+    const NSUInteger frameCount = filledBytes / sizeof(int16_t);
+    const NSInteger outRate = _pcmLiveTargetSampleRate;
+    const NSInteger inRate = _pcmLiveCaptureRate;
+    if (inRate == outRate) {
+      emitPcmChunk(emitter, pcm, frameCount, outRate);
+    } else {
+      // Ceiling of frameCount * outRate / inRate: upper bound on resampled frames.
+      const NSUInteger capacity =
+          (frameCount * (NSUInteger)outRate + (NSUInteger)inRate - 1) / (NSUInteger)inRate;
+      if (capacity > 0) {
+        int16_t *scratch = (int16_t *)malloc(capacity * sizeof(int16_t));
+        if (scratch == NULL) {
+          emitPcmError(emitter, @"Failed to allocate resample buffer");
+        } else {
+          const NSUInteger produced = pcmLiveResampleInt16(pcm, frameCount,
+                                                          (int)inRate, (int)outRate,
+                                                          scratch, capacity);
+          if (produced > 0) {
+            emitPcmChunk(emitter, scratch, produced, outRate);
+          }
+          free(scratch);
+        }
+      }
+    }
+  }
+  // Hand the buffer back to the queue so capture can continue.
+  AudioQueueEnqueueBuffer(inAQ, inBuffer, 0, NULL);
+}
+/**
+ * Stops and destroys the current input queue, if one exists.
+ *
+ * Clears the running flag, stops the queue, frees every allocated buffer, disposes
+ * the queue and resets the globals. A no-op when no queue exists.
+ */
+static void pcmLiveStopQueue(void) {
+  AudioQueueRef queue = _pcmLiveAudioQueue;
+  if (queue != NULL) {
+    // Clear the flag first so the input callback stops forwarding audio.
+    _pcmLiveAQRunning = NO;
+    AudioQueueStop(queue, true);
+    UInt32 slot = 0;
+    while (slot < kPcmLiveAQNumberBuffers) {
+      AudioQueueBufferRef buffer = _pcmLiveAQBuffers[slot];
+      if (buffer != NULL) {
+        AudioQueueFreeBuffer(queue, buffer);
+        _pcmLiveAQBuffers[slot] = NULL;
+      }
+      slot++;
+    }
+    AudioQueueDispose(queue, true);
+    _pcmLiveAudioQueue = NULL;
+  }
+}
+@implementation SherpaOnnx (PcmLiveStream)
+/**
+ * Starts PCM live capture (fallback / non-codegen entry point).
+ *
+ * Reads "sampleRate" and "bufferSizeFrames" from optionsArg when it is a dictionary.
+ * Missing, non-numeric or non-positive values fall back to 16000 Hz and the default
+ * buffer size respectively.
+ *
+ * @param optionsArg Options object coming from JS; ignored unless it is an NSDictionary.
+ * @param resolve    Called with nil once capture has started.
+ * @param reject     Called with code "PCM_LIVE_STREAM_ERROR" on failure.
+ */
+- (void)startPcmLiveStream:(id __unsafe_unretained)optionsArg
+                   resolve:(RCTPromiseResolveBlock)resolve
+                    reject:(RCTPromiseRejectBlock)reject
+{
+  int targetRate = 16000;
+  UInt32 bufferSizeFrames = 0;
+  // Parse optionsArg coming from JS (fallback / non-codegen path).
+  if ([optionsArg isKindOfClass:[NSDictionary class]]) {
+    NSDictionary *dict = (NSDictionary *)optionsArg;
+    id sampleRateValue = dict[@"sampleRate"];
+    if ([sampleRateValue respondsToSelector:@selector(intValue)]) {
+      int v = (int)[sampleRateValue intValue];
+      if (v > 0) targetRate = v;
+    }
+    id bufferSizeValue = dict[@"bufferSizeFrames"];
+    if ([bufferSizeValue respondsToSelector:@selector(doubleValue)]) {
+      double v = [bufferSizeValue doubleValue];
+      // Saturate instead of casting directly: converting a double that exceeds the
+      // UInt32 range is undefined behavior.
+      if (v > 0) bufferSizeFrames = (v >= (double)UINT32_MAX) ? UINT32_MAX : (UInt32)v;
+    }
+  }
+  [self _startPcmLiveStreamWithTargetRate:targetRate bufferSizeFrames:bufferSizeFrames resolve:resolve reject:reject];
+}
+#if __has_include(<SherpaOnnxSpec/SherpaOnnxSpec.h>)
+/**
+ * Starts PCM live capture (codegen entry point, compiled only when the generated
+ * spec header is available).
+ *
+ * @param options Typed options; a zero or non-positive sampleRate falls back to 16000 Hz,
+ *                and an absent or non-positive bufferSizeFrames selects the default size.
+ * @param resolve Called with nil once capture has started.
+ * @param reject  Called with code "PCM_LIVE_STREAM_ERROR" on failure.
+ */
+- (void)startPcmLiveStreamWithOptions:(JS::NativeSherpaOnnx::SpecStartPcmLiveStreamOptions &)options
+                             resolve:(RCTPromiseResolveBlock)resolve
+                              reject:(RCTPromiseRejectBlock)reject
+{
+  int targetRate = 16000;
+  if (options.sampleRate()) {
+    targetRate = (int)options.sampleRate();
+    if (targetRate <= 0) targetRate = 16000;
+  }
+  UInt32 bufferSizeFrames = 0;
+  if (options.bufferSizeFrames().has_value()) {
+    double v = options.bufferSizeFrames().value();
+    // Saturate instead of casting directly: converting a double that exceeds the
+    // UInt32 range is undefined behavior.
+    if (v > 0) bufferSizeFrames = (v >= (double)UINT32_MAX) ? UINT32_MAX : (UInt32)v;
+  }
+  [self _startPcmLiveStreamWithTargetRate:targetRate bufferSizeFrames:bufferSizeFrames resolve:resolve reject:reject];
+}
+#endif
+/**
+ * Shared implementation behind both start entry points.
+ *
+ * Tears down any existing queue, configures and activates the shared audio session,
+ * creates a mono 16-bit input queue at the first capture rate that succeeds, then
+ * allocates, enqueues and starts the buffers. On any failure after session activation
+ * the session is deactivated and the promise is rejected.
+ *
+ * NOTE(review): microphone permission is not checked here — confirm the caller
+ * requests it before starting capture.
+ *
+ * @param targetRate       Sample rate in Hz of the PCM delivered to JS.
+ * @param bufferSizeFrames Requested frames per buffer; 0 selects the 2048-byte default.
+ *                         Non-zero values are clamped to 512..16384 frames
+ *                         (1024..32768 bytes).
+ * @param resolve          Called with nil once the queue has started.
+ * @param reject           Called with code "PCM_LIVE_STREAM_ERROR" on failure.
+ */
+- (void)_startPcmLiveStreamWithTargetRate:(int)targetRate
+                       bufferSizeFrames:(UInt32)bufferSizeFrames
+                                 resolve:(RCTPromiseResolveBlock)resolve
+                                  reject:(RCTPromiseRejectBlock)reject
+{
+  // Restarting replaces any capture that is already in progress.
+  pcmLiveStopQueue();
+  _pcmLiveTargetSampleRate = targetRate;
+  _pcmLiveModule = self;
+  NSError *error = nil;
+  AVAudioSession *session = [AVAudioSession sharedInstance];
+  if (![session setCategory:AVAudioSessionCategoryPlayAndRecord
+                       mode:AVAudioSessionModeDefault
+                    options:AVAudioSessionCategoryOptionDefaultToSpeaker | AVAudioSessionCategoryOptionAllowBluetooth
+                      error:&error]) {
+    RCTLog(@"%@", [NSString stringWithFormat:@"[SherpaOnnx PcmLive] setCategory error: %@", error]);
+    reject(@"PCM_LIVE_STREAM_ERROR", error.localizedDescription ?: @"Failed to set audio session", error);
+    return;
+  }
+  if (![session setActive:YES withOptions:0 error:&error]) {
+    RCTLog(@"%@", [NSString stringWithFormat:@"[SherpaOnnx PcmLive] setActive error: %@", error]);
+    reject(@"PCM_LIVE_STREAM_ERROR", error.localizedDescription ?: @"Failed to activate audio session", error);
+    return;
+  }
+  // Mono, packed, signed 16-bit linear PCM; the sample rate is filled in per attempt below.
+  AudioStreamBasicDescription fmt;
+  memset(&fmt, 0, sizeof(fmt));
+  fmt.mFormatID = kAudioFormatLinearPCM;
+  fmt.mFormatFlags = kLinearPCMFormatFlagIsSignedInteger | kLinearPCMFormatFlagIsPacked;
+  fmt.mChannelsPerFrame = 1;
+  fmt.mBitsPerChannel = 16;
+  fmt.mBytesPerPacket = 2;
+  fmt.mBytesPerFrame = 2;
+  fmt.mFramesPerPacket = 1;
+  OSStatus status = noErr;
+  int chosenCaptureRate = 16000;
+  // Try each candidate capture rate in order and keep the first queue that can be created.
+  for (size_t r = 0; r < kPcmLiveCaptureRatesCount; r++) {
+    chosenCaptureRate = kPcmLiveCaptureRates[r];
+    fmt.mSampleRate = (Float64)chosenCaptureRate;
+    status = AudioQueueNewInput(&fmt, pcmLiveAQInputCallback, NULL, NULL, NULL, 0, &_pcmLiveAudioQueue);
+    if (status == noErr) break;
+    _pcmLiveAudioQueue = NULL;
+  }
+  if (status != noErr || _pcmLiveAudioQueue == NULL) {
+    [session setActive:NO withOptions:0 error:nil];
+    reject(@"PCM_LIVE_STREAM_ERROR", [NSString stringWithFormat:@"AudioQueueNewInput failed for all rates (last: %d)", (int)status], nil);
+    return;
+  }
+  _pcmLiveCaptureRate = chosenCaptureRate;
+  UInt32 bufferByteSize = 2048;
+  if (bufferSizeFrames > 0) {
+    // Clamp in frames before converting to bytes: multiplying first could wrap around
+    // UInt32 for very large requests and silently select the minimum size instead of
+    // the maximum.
+    UInt32 frames = bufferSizeFrames;
+    if (frames < 512) frames = 512;
+    if (frames > 16384) frames = 16384;
+    bufferByteSize = frames * 2;  /* 16-bit mono */
+  }
+  for (UInt32 i = 0; i < kPcmLiveAQNumberBuffers; i++) {
+    status = AudioQueueAllocateBuffer(_pcmLiveAudioQueue, bufferByteSize, &_pcmLiveAQBuffers[i]);
+    if (status != noErr) {
+      pcmLiveStopQueue();
+      [session setActive:NO withOptions:0 error:nil];
+      reject(@"PCM_LIVE_STREAM_ERROR", [NSString stringWithFormat:@"AudioQueueAllocateBuffer failed: %d", (int)status], nil);
+      return;
+    }
+    // A buffer that cannot be enqueued would never be filled, so treat it as a start failure.
+    status = AudioQueueEnqueueBuffer(_pcmLiveAudioQueue, _pcmLiveAQBuffers[i], 0, NULL);
+    if (status != noErr) {
+      pcmLiveStopQueue();
+      [session setActive:NO withOptions:0 error:nil];
+      reject(@"PCM_LIVE_STREAM_ERROR", [NSString stringWithFormat:@"AudioQueueEnqueueBuffer failed: %d", (int)status], nil);
+      return;
+    }
+  }
+  // Set the flag before starting so the first callback is not dropped.
+  _pcmLiveAQRunning = YES;
+  status = AudioQueueStart(_pcmLiveAudioQueue, NULL);
+  if (status != noErr) {
+    pcmLiveStopQueue();
+    [session setActive:NO withOptions:0 error:nil];
+    reject(@"PCM_LIVE_STREAM_ERROR", [NSString stringWithFormat:@"AudioQueueStart failed: %d", (int)status], nil);
+    return;
+  }
+  resolve(nil);
+}
+/**
+ * Stops PCM live capture; forwards to stopPcmLiveStreamWithResolve:reject:.
+ */
+- (void)stopPcmLiveStream:(RCTPromiseResolveBlock)resolve
+                   reject:(RCTPromiseRejectBlock)reject
+{
+  [self stopPcmLiveStreamWithResolve:resolve reject:reject];
+}
+/**
+ * Stops and disposes the input queue, deactivates the shared audio session (notifying
+ * other audio sessions), and always resolves with nil. Session deactivation errors
+ * are ignored; reject is never called.
+ */
+- (void)stopPcmLiveStreamWithResolve:(RCTPromiseResolveBlock)resolve
+                             reject:(RCTPromiseRejectBlock)reject
+{
+  pcmLiveStopQueue();
+  [[AVAudioSession sharedInstance] setActive:NO withOptions:AVAudioSessionSetActiveOptionNotifyOthersOnDeactivation error:nil];
+  resolve(nil);
+}
+@end

package/ios/SherpaOnnx+STT.mm CHANGED Viewed

@@ -38,6 +38,7 @@ static NSString *sttModelKindToNSString(sherpaonnx::SttModelKind kind) {
         case K::kFunAsrNano: return @"funasr_nano";
         case K::kFireRedAsr: return @"fire_red_asr";
         case K::kMoonshine: return @"moonshine";
+        case K::kMoonshineV2: return @"moonshine_v2";
         case K::kDolphin: return @"dolphin";
         case K::kCanary: return @"canary";
         case K::kOmnilingual: return @"omnilingual";
@@ -268,6 +269,7 @@ static NSDictionary *sttResultToDict(const sherpaonnx::SttRecognitionResult& r)
         NSMutableDictionary *resultDict = [NSMutableDictionary dictionary];
         resultDict[@"success"] = @(result.ok);
+        resultDict[@"isHardwareSpecificUnsupported"] = @(result.isHardwareSpecificUnsupported);
         if (!result.error.empty()) {
             resultDict[@"error"] = [NSString stringWithUTF8String:result.error.c_str()];
         }

package/ios/SherpaOnnx+TTS.mm CHANGED Viewed

@@ -232,6 +232,13 @@ std::vector<std::string> SplitTtsTokens(const std::string &text) {
         }
         resultDict[@"detectedModels"] = detectedModelsArray;
         resultDict[@"modelType"] = ttsModelKindToNSString(result.selectedKind);
+        if (!result.lexiconLanguageCandidates.empty()) {
+            NSMutableArray *langCandidates = [NSMutableArray array];
+            for (const auto& id : result.lexiconLanguageCandidates) {
+                [langCandidates addObject:[NSString stringWithUTF8String:id.c_str()]];
+            }
+            resultDict[@"lexiconLanguageCandidates"] = langCandidates;
+        }
         resolve(resultDict);
     } @catch (NSException *exception) {
         NSString *errorMsg = [NSString stringWithFormat:@"TTS model detection failed: %@", exception.reason];
@@ -1041,6 +1048,16 @@ std::vector<std::string> SplitTtsTokens(const std::string &text) {
     }
 }
+// iOS stub: always rejects with TTS_SAVE_ERROR; none of the path/URI arguments are used.
+- (void)copyFileToContentUri:(NSString *)filePath
+              directoryUri:(NSString *)directoryUri
+                  filename:(NSString *)filename
+                  mimeType:(NSString *)mimeType
+                   resolve:(RCTPromiseResolveBlock)resolve
+                    reject:(RCTPromiseRejectBlock)reject
+{
+    NSString *unsupportedMessage = @"Copy file to content URI is not supported on iOS (Android SAF only)";
+    reject(@"TTS_SAVE_ERROR", unsupportedMessage, nil);
+}
 - (void)saveTtsTextToContentUri:(NSString *)text
                  directoryUri:(NSString *)directoryUri
                      filename:(NSString *)filename

package/ios/SherpaOnnx.mm CHANGED Viewed

@@ -11,6 +11,8 @@
 #import "SherpaOnnx+Assets.h"
 #import "sherpa-onnx-archive-helper.h"
 #import <React/RCTLog.h>
+#import <AVFoundation/AVFoundation.h>
+#import "SherpaOnnxAudioConvert.h"
 #if __has_include("SherpaOnnx-Swift.h")
 #import "SherpaOnnx-Swift.h"
 #endif
@@ -36,7 +38,7 @@
 - (NSArray<NSString *> *)supportedEvents
 {
-    return @[ @"ttsStreamChunk", @"ttsStreamEnd", @"ttsStreamError", @"extractTarBz2Progress" ];
+    return @[ @"ttsStreamChunk", @"ttsStreamEnd", @"ttsStreamError", @"extractTarBz2Progress", @"pcmLiveStreamData", @"pcmLiveStreamError" ];
 }
 - (void)resolveModelPath:(JS::NativeSherpaOnnx::SpecResolveModelPathConfig &)config
@@ -93,6 +95,12 @@
     resolve(@{ @"providerCompiled": @NO, @"hasAccelerator": @NO, @"canInit": @NO });
 }
+// iOS stub: always resolves with a null SoC and isSupported = NO; reject is never called.
+- (void)getDeviceQnnSoc:(RCTPromiseResolveBlock)resolve
+                  reject:(RCTPromiseRejectBlock)reject
+{
+    NSDictionary *noQnnInfo = @{ @"soc": [NSNull null], @"isSupported": @NO };
+    resolve(noQnnInfo);
+}
 // NNAPI is Android-only; on iOS we always return no support.
 - (void)getNnapiSupport:(NSString *)modelBase64
                 resolve:(RCTPromiseResolveBlock)resolve
@@ -183,7 +191,16 @@
                     resolve:(RCTPromiseResolveBlock)resolve
                      reject:(RCTPromiseRejectBlock)reject
 {
-    reject(@"UNSUPPORTED", @"convertAudioToFormat is not implemented on iOS", nil);
+    NSError *error = nil;
+    if (![SherpaOnnxAudioConvert convertAudioToFormat:inputPath
+                                           outputPath:outputPath
+                                               format:format
+                                   outputSampleRateHz:outputSampleRateHz.intValue
+                                                error:&error]) {
+        reject(@"CONVERT_ERROR", error ? error.localizedDescription : @"Conversion failed", error);
+        return;
+    }
+    resolve(nil);
 }
 - (void)convertAudioToWav16k:(NSString *)inputPath
@@ -191,7 +208,14 @@
                     resolve:(RCTPromiseResolveBlock)resolve
                      reject:(RCTPromiseRejectBlock)reject
 {
-    reject(@"UNSUPPORTED", @"convertAudioToWav16k is not implemented on iOS", nil);
+    NSError *error = nil;
+    if (![SherpaOnnxAudioConvert convertAudioToWav16k:inputPath
+                                           outputPath:outputPath
+                                                error:&error]) {
+        reject(@"CONVERT_ERROR", error ? error.localizedDescription : @"Conversion to WAV 16kHz mono failed", error);
+        return;
+    }
+    resolve(nil);
 }
 - (void)getAvailableProviders:(RCTPromiseResolveBlock)resolve

package/ios/SherpaOnnxAudioConvert.h ADDED Viewed

@@ -0,0 +1,28 @@
+#import <Foundation/Foundation.h>
+NS_ASSUME_NONNULL_BEGIN
+@interface SherpaOnnxAudioConvert : NSObject
+/**
+ * Converts any supported audio file to 16 kHz mono 16-bit PCM WAV.
+ * Returns YES on success, NO on failure. Populates `error` on failure.
+ *
+ * @param inputPath  Source audio file (presumably a filesystem path — confirm against the implementation).
+ * @param outputPath Destination of the converted WAV (presumably a filesystem path — confirm).
+ * @param error      Out-parameter describing the failure; callers should test the BOOL
+ *                   return value rather than this pointer.
+ * @return YES on success, NO on failure.
+ */
++ (BOOL)convertAudioToWav16k:(NSString *)inputPath
+                  outputPath:(NSString *)outputPath
+                       error:(NSError **)error;
+/**
+ * Converts arbitrary audio file to requested format (e.g. "mp3", "flac", "wav").
+ * outputSampleRateHz is mostly used for MP3 encoding.
+ * Returns YES on success, NO on failure. Populates `error` on failure.
+ *
+ * @param inputPath          Source audio file (presumably a filesystem path — confirm).
+ * @param outputPath         Destination of the converted file (presumably a filesystem path — confirm).
+ * @param format             Target format name, e.g. "mp3", "flac" or "wav".
+ * @param outputSampleRateHz Requested output sample rate in Hz; how formats other than
+ *                           MP3 treat it is not specified here — TODO confirm.
+ * @param error              Out-parameter describing the failure; callers should test the
+ *                           BOOL return value rather than this pointer.
+ * @return YES on success, NO on failure.
+ */
++ (BOOL)convertAudioToFormat:(NSString *)inputPath
+                  outputPath:(NSString *)outputPath
+                      format:(NSString *)format
+          outputSampleRateHz:(int)outputSampleRateHz
+                       error:(NSError **)error;
+@end
+NS_ASSUME_NONNULL_END