npm - react-native-audio-api - Versions diffs - 0.9.0 → 0.10.0-nightly-971a6b4-20251010 - Mend

react-native-audio-api 0.9.0 → 0.10.0-nightly-971a6b4-20251010

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60)

package/android/src/main/cpp/audioapi/android/core/{AudioDecoder.cpp → utils/AudioDecoder.cpp} +79 -75
package/common/cpp/audioapi/AudioAPIModuleInstaller.h +124 -43
package/common/cpp/audioapi/HostObjects/BaseAudioContextHostObject.cpp +1 -101
package/common/cpp/audioapi/HostObjects/BaseAudioContextHostObject.h +0 -3
package/common/cpp/audioapi/HostObjects/utils/AudioDecoderHostObject.cpp +133 -0
package/common/cpp/audioapi/HostObjects/utils/AudioDecoderHostObject.h +28 -0
package/common/cpp/audioapi/HostObjects/utils/AudioStretcherHostObject.cpp +58 -0
package/common/cpp/audioapi/HostObjects/utils/AudioStretcherHostObject.h +26 -0
package/common/cpp/audioapi/core/AudioContext.cpp +0 -2
package/common/cpp/audioapi/core/BaseAudioContext.cpp +0 -35
package/common/cpp/audioapi/core/BaseAudioContext.h +4 -12
package/common/cpp/audioapi/core/OfflineAudioContext.cpp +0 -2
package/common/cpp/audioapi/core/sources/AudioBufferBaseSourceNode.cpp +0 -4
package/common/cpp/audioapi/core/sources/AudioBufferBaseSourceNode.h +0 -1
package/common/cpp/audioapi/core/sources/AudioBufferSourceNode.cpp +0 -2
package/common/cpp/audioapi/core/sources/AudioScheduledSourceNode.cpp +0 -4
package/common/cpp/audioapi/core/sources/AudioScheduledSourceNode.h +0 -1
package/common/cpp/audioapi/core/types/AudioFormat.h +16 -0
package/common/cpp/audioapi/core/utils/AudioDecoder.h +36 -91
package/common/cpp/audioapi/core/utils/AudioStretcher.cpp +75 -0
package/common/cpp/audioapi/core/utils/AudioStretcher.h +30 -0
package/common/cpp/audioapi/core/utils/Constants.h +4 -0
package/common/cpp/audioapi/events/AudioEventHandlerRegistry.cpp +5 -1
package/common/cpp/audioapi/libs/ffmpeg/FFmpegDecoding.cpp +241 -282
package/common/cpp/audioapi/libs/ffmpeg/FFmpegDecoding.h +57 -19
package/common/cpp/test/CMakeLists.txt +1 -1
package/ios/audioapi/ios/core/utils/AudioDecoder.mm +160 -0
package/lib/commonjs/api.js +21 -1
package/lib/commonjs/api.js.map +1 -1
package/lib/commonjs/core/AudioDecoder.js +48 -0
package/lib/commonjs/core/AudioDecoder.js.map +1 -0
package/lib/commonjs/core/AudioStretcher.js +31 -0
package/lib/commonjs/core/AudioStretcher.js.map +1 -0
package/lib/commonjs/core/BaseAudioContext.js +11 -18
package/lib/commonjs/core/BaseAudioContext.js.map +1 -1
package/lib/module/api.js +3 -1
package/lib/module/api.js.map +1 -1
package/lib/module/core/AudioDecoder.js +42 -0
package/lib/module/core/AudioDecoder.js.map +1 -0
package/lib/module/core/AudioStretcher.js +26 -0
package/lib/module/core/AudioStretcher.js.map +1 -0
package/lib/module/core/BaseAudioContext.js +11 -18
package/lib/module/core/BaseAudioContext.js.map +1 -1
package/lib/typescript/api.d.ts +5 -1
package/lib/typescript/api.d.ts.map +1 -1
package/lib/typescript/core/AudioDecoder.d.ts +4 -0
package/lib/typescript/core/AudioDecoder.d.ts.map +1 -0
package/lib/typescript/core/AudioStretcher.d.ts +3 -0
package/lib/typescript/core/AudioStretcher.d.ts.map +1 -0
package/lib/typescript/core/BaseAudioContext.d.ts +3 -6
package/lib/typescript/core/BaseAudioContext.d.ts.map +1 -1
package/lib/typescript/interfaces.d.ts +10 -3
package/lib/typescript/interfaces.d.ts.map +1 -1
package/package.json +1 -1
package/src/api.ts +10 -0
package/src/core/AudioDecoder.ts +78 -0
package/src/core/AudioStretcher.ts +43 -0
package/src/core/BaseAudioContext.ts +26 -29
package/src/interfaces.ts +26 -6
package/ios/audioapi/ios/core/AudioDecoder.mm +0 -156

package/common/cpp/audioapi/libs/ffmpeg/FFmpegDecoding.cpp CHANGED

@@ -1,16 +1,20 @@
 /*
- * This file dynamically links to the FFmpeg library, which is licensed under the
- * GNU Lesser General Public License (LGPL) version 2.1 or later.
+ * This file dynamically links to the FFmpeg library, which is licensed under
+ * the GNU Lesser General Public License (LGPL) version 2.1 or later.
  *
- * Our own code in this file is licensed under the MIT License and dynamic linking
- * allows you to use this code without your entire project being subject to the
- * terms of the LGPL. However, note that if you link statically to FFmpeg, you must
- * comply with the terms of the LGPL for FFmpeg itself.
+ * Our own code in this file is licensed under the MIT License and dynamic
+ * linking allows you to use this code without your entire project being subject
+ * to the terms of the LGPL. However, note that if you link statically to
+ * FFmpeg, you must comply with the terms of the LGPL for FFmpeg itself.
  */
-#include "FFmpegDecoding.h"
+#include <audioapi/core/sources/AudioBuffer.h>
+#include <audioapi/libs/ffmpeg/FFmpegDecoding.h>
+#include <audioapi/utils/AudioArray.h>
+#include <audioapi/utils/AudioBus.h>
+#include <functional>
-namespace audioapi::ffmpegdecoding {
+namespace audioapi::ffmpegdecoder {
 int read_packet(void *opaque, uint8_t *buf, int buf_size) {
   MemoryIOContext *ctx = static_cast<MemoryIOContext *>(opaque);
@@ -51,42 +55,87 @@ int64_t seek_packet(void *opaque, int64_t offset, int whence) {
   return ctx->pos;
 }
-std::vector<int16_t> readAllPcmFrames(
+void convertFrameToBuffer(
+    SwrContext *swr,
+    AVFrame *frame,
+    int output_channel_count,
+    std::vector<float> &buffer,
+    size_t &framesRead,
+    uint8_t **&resampled_data,
+    int &max_resampled_samples) {
+  const int out_samples = swr_get_out_samples(swr, frame->nb_samples);
+  if (out_samples > max_resampled_samples) {
+    av_freep(&resampled_data[0]);
+    av_freep(&resampled_data);
+    max_resampled_samples = out_samples;
+    if (av_samples_alloc_array_and_samples(
+            &resampled_data,
+            nullptr,
+            output_channel_count,
+            max_resampled_samples,
+            AV_SAMPLE_FMT_FLT,
+            0) < 0) {
+      return;
+    }
+  }
+  int converted_samples = swr_convert(
+      swr,
+      resampled_data,
+      max_resampled_samples,
+      const_cast<const uint8_t **>(frame->data),
+      frame->nb_samples);
+  if (converted_samples > 0) {
+    const size_t current_size = buffer.size();
+    const size_t new_samples =
+        static_cast<size_t>(converted_samples) * output_channel_count;
+    buffer.resize(current_size + new_samples);
+    memcpy(
+        buffer.data() + current_size,
+        resampled_data[0],
+        new_samples * sizeof(float));
+    framesRead += converted_samples;
+  }
+}
+std::vector<float> readAllPcmFrames(
     AVFormatContext *fmt_ctx,
     AVCodecContext *codec_ctx,
     int out_sample_rate,
+    int output_channel_count,
     int audio_stream_index,
-    int channels,
     size_t &framesRead) {
-  std::vector<int16_t> buffer;
-  SwrContext *swr_ctx = swr_alloc();
-  if (swr_ctx == nullptr) {
+  framesRead = 0;
+  std::vector<float> buffer;
+  auto swr = std::unique_ptr<SwrContext, std::function<void(SwrContext *)>>(
+      swr_alloc(), [](SwrContext *ctx) { swr_free(&ctx); });
+  if (swr == nullptr)
     return buffer;
-  }
-  av_opt_set_chlayout(swr_ctx, "in_chlayout", &codec_ctx->ch_layout, 0);
-  av_opt_set_int(swr_ctx, "in_sample_rate", codec_ctx->sample_rate, 0);
-  av_opt_set_sample_fmt(swr_ctx, "in_sample_fmt", codec_ctx->sample_fmt, 0);
+  av_opt_set_chlayout(swr.get(), "in_chlayout", &codec_ctx->ch_layout, 0);
+  av_opt_set_int(swr.get(), "in_sample_rate", codec_ctx->sample_rate, 0);
+  av_opt_set_sample_fmt(swr.get(), "in_sample_fmt", codec_ctx->sample_fmt, 0);
   AVChannelLayout out_ch_layout;
-  av_channel_layout_default(&out_ch_layout, channels);
-  av_opt_set_chlayout(swr_ctx, "out_chlayout", &out_ch_layout, 0);
-  av_opt_set_int(swr_ctx, "out_sample_rate", out_sample_rate, 0);
-  av_opt_set_sample_fmt(swr_ctx, "out_sample_fmt", AV_SAMPLE_FMT_S16, 0);
+  av_channel_layout_default(&out_ch_layout, output_channel_count);
+  av_opt_set_chlayout(swr.get(), "out_chlayout", &out_ch_layout, 0);
+  av_opt_set_int(swr.get(), "out_sample_rate", out_sample_rate, 0);
+  av_opt_set_sample_fmt(swr.get(), "out_sample_fmt", AV_SAMPLE_FMT_FLT, 0);
-  if (swr_init(swr_ctx) < 0) {
-    swr_free(&swr_ctx);
+  if (swr_init(swr.get()) < 0) {
     av_channel_layout_uninit(&out_ch_layout);
     return buffer;
   }
-  AVPacket *packet = av_packet_alloc();
-  AVFrame *frame = av_frame_alloc();
+  auto packet = std::unique_ptr<AVPacket, std::function<void(AVPacket *)>>(
+      av_packet_alloc(), [](AVPacket *p) { av_packet_free(&p); });
+  auto frame = std::unique_ptr<AVFrame, std::function<void(AVFrame *)>>(
+      av_frame_alloc(), [](AVFrame *p) { av_frame_free(&p); });
   if (packet == nullptr || frame == nullptr) {
-    if (packet != nullptr) av_packet_free(&packet);
-    if (frame != nullptr) av_frame_free(&frame);
-    swr_free(&swr_ctx);
     av_channel_layout_uninit(&out_ch_layout);
     return buffer;
   }
@@ -94,312 +143,222 @@ std::vector<int16_t> readAllPcmFrames(
   // Allocate buffer for resampled data
   uint8_t **resampled_data = nullptr;
   int max_resampled_samples = 4096; // Initial size
-  int ret = av_samples_alloc_array_and_samples(
-      &resampled_data,
-      nullptr,
-      channels,
-      max_resampled_samples,
-      AV_SAMPLE_FMT_S16,
-      0);
-  if (ret < 0) {
-    av_frame_free(&frame);
-    av_packet_free(&packet);
-    swr_free(&swr_ctx);
+  if (av_samples_alloc_array_and_samples(
+          &resampled_data,
+          nullptr,
+          output_channel_count,
+          max_resampled_samples,
+          AV_SAMPLE_FMT_FLT,
+          0) < 0) {
     av_channel_layout_uninit(&out_ch_layout);
     return buffer;
   }
-  framesRead = 0;
-  while (av_read_frame(fmt_ctx, packet) >= 0) {
+  while (av_read_frame(fmt_ctx, packet.get()) >= 0) {
     if (packet->stream_index == audio_stream_index) {
-      if (avcodec_send_packet(codec_ctx, packet) == 0) {
-        while (avcodec_receive_frame(codec_ctx, frame) == 0) {
-          // Check if we need more buffer space
-          int out_samples = swr_get_out_samples(swr_ctx, frame->nb_samples);
-          if (out_samples > max_resampled_samples) {
-            if (resampled_data != nullptr) {
-              av_freep(&resampled_data[0]);
-              av_freep(&resampled_data);
-            }
-            max_resampled_samples = out_samples;
-            ret = av_samples_alloc_array_and_samples(
-                &resampled_data,
-                nullptr,
-                channels,
-                max_resampled_samples,
-                AV_SAMPLE_FMT_S16,
-                0);
-            if (ret < 0) {
-              break; // Exit on allocation failure
-            }
-          }
-          int converted_samples = swr_convert(
-              swr_ctx,
+      if (avcodec_send_packet(codec_ctx, packet.get()) == 0) {
+        while (avcodec_receive_frame(codec_ctx, frame.get()) == 0) {
+          convertFrameToBuffer(
+              swr.get(),
+              frame.get(),
+              output_channel_count,
+              buffer,
+              framesRead,
               resampled_data,
-              max_resampled_samples,
-              (const uint8_t **)frame->data,
-              frame->nb_samples);
-          if (converted_samples > 0) {
-            size_t current_size = buffer.size();
-            size_t new_samples = converted_samples * channels;
-            buffer.resize(current_size + new_samples);
-            memcpy(
-                buffer.data() + current_size,
-                resampled_data[0],
-                new_samples * sizeof(int16_t));
-            framesRead += converted_samples;
-          }
+              max_resampled_samples);
         }
       }
     }
-    av_packet_unref(packet);
+    av_packet_unref(packet.get());
   }
   // Flush decoder
   avcodec_send_packet(codec_ctx, nullptr);
-  while (avcodec_receive_frame(codec_ctx, frame) == 0) {
-    int out_samples = swr_get_out_samples(swr_ctx, frame->nb_samples);
-    if (out_samples > max_resampled_samples) {
-      if (resampled_data != nullptr) {
-        av_freep(&resampled_data[0]);
-        av_freep(&resampled_data);
-      }
-      max_resampled_samples = out_samples;
-      ret = av_samples_alloc_array_and_samples(
-          &resampled_data,
-          nullptr,
-          channels,
-          max_resampled_samples,
-          AV_SAMPLE_FMT_S16,
-          0);
-      if (ret < 0) {
-        break;
-      }
-    }
-    int converted_samples = swr_convert(
-        swr_ctx,
+  while (avcodec_receive_frame(codec_ctx, frame.get()) == 0) {
+    convertFrameToBuffer(
+        swr.get(),
+        frame.get(),
+        output_channel_count,
+        buffer,
+        framesRead,
         resampled_data,
-        max_resampled_samples,
-        (const uint8_t **)frame->data,
-        frame->nb_samples);
-    if (converted_samples > 0) {
-      size_t current_size = buffer.size();
-      size_t new_samples = converted_samples * channels;
-      buffer.resize(current_size + new_samples);
-      memcpy(
-          buffer.data() + current_size,
-          resampled_data[0],
-          new_samples * sizeof(int16_t));
-      framesRead += converted_samples;
-    }
+        max_resampled_samples);
   }
-  if (resampled_data != nullptr) {
-    av_freep(&resampled_data[0]);
-    av_freep(&resampled_data);
-  }
-  swr_free(&swr_ctx);
+  av_freep(&resampled_data[0]);
+  av_freep(&resampled_data);
   av_channel_layout_uninit(&out_ch_layout);
-  av_frame_free(&frame);
-  av_packet_free(&packet);
   return buffer;
 }
-std::vector<int16_t> decodeWithMemoryBlock(const void *data, size_t size, const int channel_count, int sample_rate) {
-    if (data == nullptr || size == 0) {
-        return {};
-    }
-    MemoryIOContext io_ctx;
-    io_ctx.data = static_cast<const uint8_t *>(data);
-    io_ctx.size = size;
-    io_ctx.pos = 0;
-    constexpr size_t buffer_size = 4096;
-    uint8_t *io_buffer = static_cast<uint8_t *>(av_malloc(buffer_size));
-    if (io_buffer == nullptr) {
-        return {};
+inline int findAudioStreamIndex(AVFormatContext *fmt_ctx) {
+  for (int i = 0; i < fmt_ctx->nb_streams; i++) {
+    if (fmt_ctx->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
+      return i;
     }
+  }
+  return -1;
+}
-    AVIOContext *avio_ctx = avio_alloc_context(
-        io_buffer, buffer_size, 0, &io_ctx, read_packet, nullptr, seek_packet);
-    if (avio_ctx == nullptr) {
-      av_free(io_buffer);
-      return {};
-    }
+bool setupDecoderContext(
+    AVFormatContext *fmt_ctx,
+    int &audio_stream_index,
+    std::unique_ptr<AVCodecContext, std::function<void(AVCodecContext *)>>
+        &codec_ctx) {
+  audio_stream_index = findAudioStreamIndex(fmt_ctx);
+  if (audio_stream_index == -1) {
+    return false;
+  }
-    // Create format context and set custom IO
-    AVFormatContext *fmt_ctx = avformat_alloc_context();
-    if (fmt_ctx == nullptr) {
-      avio_context_free(&avio_ctx);
-      return {};
-    }
-    fmt_ctx->pb = avio_ctx;
-    // Open input from memory
-    if (avformat_open_input(&fmt_ctx, nullptr, nullptr, nullptr) < 0) {
-      avformat_free_context(fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  AVCodecParameters *codecpar = fmt_ctx->streams[audio_stream_index]->codecpar;
+  const AVCodec *codec = avcodec_find_decoder(codecpar->codec_id);
+  if (codec == nullptr) {
+    return false;
+  }
-    // Find stream info
-    if (avformat_find_stream_info(fmt_ctx, nullptr) < 0) {
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  AVCodecContext *raw_codec_ctx = avcodec_alloc_context3(codec);
+  if (raw_codec_ctx == nullptr) {
+    return false;
+  }
-    int audio_stream_index = -1;
-    for (int i = 0; i < fmt_ctx->nb_streams; i++) {
-      if (fmt_ctx->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
-        audio_stream_index = i;
-        break;
-      }
-    }
+  codec_ctx.reset(raw_codec_ctx);
+  if (avcodec_parameters_to_context(codec_ctx.get(), codecpar) < 0) {
+    return false;
+  }
+  if (avcodec_open2(codec_ctx.get(), codec, nullptr) < 0) {
+    return false;
+  }
-    if (audio_stream_index == -1) {
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  return true;
+}
-    AVCodecParameters *codecpar = fmt_ctx->streams[audio_stream_index]->codecpar;
+std::shared_ptr<AudioBuffer> decodeAudioFrames(
+    AVFormatContext *fmt_ctx,
+    AVCodecContext *codec_ctx,
+    int audio_stream_index,
+    int sample_rate) {
+  size_t framesRead = 0;
+  int output_sample_rate =
+      (sample_rate > 0) ? sample_rate : codec_ctx->sample_rate;
+  int output_channel_count = codec_ctx->ch_layout.nb_channels;
+  std::vector<float> decoded_buffer = readAllPcmFrames(
+      fmt_ctx,
+      codec_ctx,
+      output_sample_rate,
+      output_channel_count,
+      audio_stream_index,
+      framesRead);
-    // Find decoder
-    const AVCodec *codec = avcodec_find_decoder(codecpar->codec_id);
-    if (codec == nullptr) {
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  if (framesRead == 0 || decoded_buffer.empty()) {
+    return nullptr;
+  }
-    // Allocate and setup codec context
-    AVCodecContext *codec_ctx = avcodec_alloc_context3(codec);
-    if (codec_ctx == nullptr) {
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  auto outputFrames = decoded_buffer.size() / output_channel_count;
+  auto audioBus = std::make_shared<AudioBus>(
+      outputFrames, output_channel_count, output_sample_rate);
-    if (avcodec_parameters_to_context(codec_ctx, codecpar) < 0) {
-      avcodec_free_context(&codec_ctx);
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
+  for (int ch = 0; ch < output_channel_count; ++ch) {
+    auto channelData = audioBus->getChannel(ch)->getData();
+    for (int i = 0; i < outputFrames; ++i) {
+      channelData[i] = decoded_buffer[i * output_channel_count + ch];
     }
+  }
+  return std::make_shared<AudioBuffer>(audioBus);
+}
-    if (avcodec_open2(codec_ctx, codec, nullptr) < 0) {
-      avcodec_free_context(&codec_ctx);
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+std::shared_ptr<AudioBuffer>
+decodeWithMemoryBlock(const void *data, size_t size, int sample_rate) {
+  if (data == nullptr || size == 0) {
+    return nullptr;
+  }
-    // Get actual channel count from the decoded stream
-    int actual_channels = codec_ctx->ch_layout.nb_channels;
+  MemoryIOContext io_ctx{static_cast<const uint8_t *>(data), size, 0};
-    // Validate channel count
-    if (actual_channels <= 0 || actual_channels > 8) {
-      avcodec_free_context(&codec_ctx);
-      avformat_close_input(&fmt_ctx);
-      avio_context_free(&avio_ctx);
-      return {};
-    }
+  constexpr size_t buffer_size = 4096;
+  auto io_buffer = std::unique_ptr<uint8_t, decltype(&av_free)>(
+      static_cast<uint8_t *>(av_malloc(buffer_size)), &av_free);
+  if (io_buffer == nullptr) {
+    return nullptr;
+  }
-    // Decode all frames
-    size_t framesRead = 0;
-    std::vector<int16_t> decoded_buffer = readAllPcmFrames(
-        fmt_ctx, codec_ctx, sample_rate, audio_stream_index, channel_count, framesRead);
+  auto avio_ctx =
+      std::unique_ptr<AVIOContext, std::function<void(AVIOContext *)>>(
+          avio_alloc_context(
+              io_buffer.get(),
+              buffer_size,
+              0,
+              &io_ctx,
+              read_packet,
+              nullptr,
+              seek_packet),
+          [](AVIOContext *ctx) { avio_context_free(&ctx); });
+  if (avio_ctx == nullptr) {
+    return nullptr;
+  }
-    // Cleanup - Note: avio_context_free will free the io_buffer
-    avcodec_free_context(&codec_ctx);
-    avformat_close_input(&fmt_ctx);
-    avio_context_free(&avio_ctx);
+  AVFormatContext *raw_fmt_ctx = avformat_alloc_context();
+  if (raw_fmt_ctx == nullptr) {
+    return nullptr;
+  }
+  raw_fmt_ctx->pb = avio_ctx.get();
-    if (framesRead == 0 || decoded_buffer.empty()) {
-      return {};
-    }
+  if (avformat_open_input(&raw_fmt_ctx, nullptr, nullptr, nullptr) < 0) {
+    avformat_free_context(raw_fmt_ctx);
+    return nullptr;
+  }
-    return decoded_buffer;
-}
+  auto fmt_ctx =
+      std::unique_ptr<AVFormatContext, decltype(&avformat_free_context)>(
+          raw_fmt_ctx, &avformat_free_context);
-std::vector<int16_t> decodeWithFilePath(const std::string &path, const int channel_count, int sample_rate) {
-  if (path.empty()) {
-      return {};
+  if (avformat_find_stream_info(fmt_ctx.get(), nullptr) < 0) {
+    return nullptr;
   }
-  AVFormatContext *fmt_ctx = nullptr;
-  if (avformat_open_input(&fmt_ctx, path.c_str(), nullptr, nullptr) < 0) {
-      return {};
-  }
-  if (avformat_find_stream_info(fmt_ctx, nullptr) < 0) {
-      avformat_close_input(&fmt_ctx);
-      return {};
-  }
+  auto codec_ctx =
+      std::unique_ptr<AVCodecContext, std::function<void(AVCodecContext *)>>(
+          nullptr, [](AVCodecContext *ctx) { avcodec_free_context(&ctx); });
   int audio_stream_index = -1;
-  for (int i = 0; i < fmt_ctx->nb_streams; i++) {
-      if (fmt_ctx->streams[i]->codecpar->codec_type == AVMEDIA_TYPE_AUDIO) {
-          audio_stream_index = i;
-          break;
-      }
-  }
-  if (audio_stream_index == -1) {
-      avformat_close_input(&fmt_ctx);
-      return {};
+  if (!setupDecoderContext(fmt_ctx.get(), audio_stream_index, codec_ctx)) {
+    return nullptr;
   }
-  AVCodecParameters *codecpar = fmt_ctx->streams[audio_stream_index]->codecpar;
-  const AVCodec *codec = avcodec_find_decoder(codecpar->codec_id);
-  if (codec == nullptr) {
-      avformat_close_input(&fmt_ctx);
-      return {};
-  }
-  AVCodecContext *codec_ctx = avcodec_alloc_context3(codec);
-  if (codec_ctx == nullptr) {
-      avformat_close_input(&fmt_ctx);
-      return {};
-  }
+  return decodeAudioFrames(
+      fmt_ctx.get(), codec_ctx.get(), audio_stream_index, sample_rate);
+}
-  if (avcodec_parameters_to_context(codec_ctx, codecpar) < 0) {
-      avcodec_free_context(&codec_ctx);
-      avformat_close_input(&fmt_ctx);
-      return {};
+std::shared_ptr<AudioBuffer> decodeWithFilePath(
+    const std::string &path,
+    int sample_rate) {
+  if (path.empty()) {
+    return nullptr;
   }
-  if (avcodec_open2(codec_ctx, codec, nullptr) < 0) {
-      avcodec_free_context(&codec_ctx);
-      avformat_close_input(&fmt_ctx);
-      return {};
-  }
+  AVFormatContext *raw_fmt_ctx = nullptr;
+  if (avformat_open_input(&raw_fmt_ctx, path.c_str(), nullptr, nullptr) < 0)
+    return nullptr;
-  size_t framesRead = 0;
-  std::vector<int16_t> decoded_buffer = readAllPcmFrames(
-      fmt_ctx, codec_ctx, sample_rate, audio_stream_index, channel_count, framesRead);
+  auto fmt_ctx =
+      std::unique_ptr<AVFormatContext, std::function<void(AVFormatContext *)>>(
+          raw_fmt_ctx,
+          [](AVFormatContext *ctx) { avformat_close_input(&ctx); });
-  avcodec_free_context(&codec_ctx);
-  avformat_close_input(&fmt_ctx);
+  if (avformat_find_stream_info(fmt_ctx.get(), nullptr) < 0) {
+    return nullptr;
+  }
-  if (framesRead == 0 || decoded_buffer.empty()) {
-      return {};
+  auto codec_ctx =
+      std::unique_ptr<AVCodecContext, std::function<void(AVCodecContext *)>>(
+          nullptr, [](AVCodecContext *ctx) { avcodec_free_context(&ctx); });
+  int audio_stream_index = -1;
+  if (!setupDecoderContext(fmt_ctx.get(), audio_stream_index, codec_ctx)) {
+    return nullptr;
   }
-  return decoded_buffer;
+  return decodeAudioFrames(
+      fmt_ctx.get(), codec_ctx.get(), audio_stream_index, sample_rate);
 }
 } // namespace audioapi::ffmpegdecoder