react-native-audio-concat 0.3.0 → 0.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
|
@@ -13,6 +13,12 @@ import android.media.MediaMuxer
|
|
|
13
13
|
import java.io.File
|
|
14
14
|
import java.nio.ByteBuffer
|
|
15
15
|
import android.util.Log
|
|
16
|
+
import java.util.concurrent.Executors
|
|
17
|
+
import java.util.concurrent.BlockingQueue
|
|
18
|
+
import java.util.concurrent.LinkedBlockingQueue
|
|
19
|
+
import java.util.concurrent.CountDownLatch
|
|
20
|
+
import java.util.concurrent.atomic.AtomicInteger
|
|
21
|
+
import java.util.concurrent.ConcurrentHashMap
|
|
16
22
|
|
|
17
23
|
@ReactModule(name = AudioConcatModule.NAME)
|
|
18
24
|
class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
@@ -29,6 +35,131 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
29
35
|
data class Silence(val durationMs: Double) : AudioDataOrSilence()
|
|
30
36
|
}
|
|
31
37
|
|
|
38
|
+
private data class PCMChunk(
|
|
39
|
+
val data: ByteArray,
|
|
40
|
+
val sequenceNumber: Int,
|
|
41
|
+
val isEndOfStream: Boolean = false
|
|
42
|
+
) {
|
|
43
|
+
companion object {
|
|
44
|
+
fun endOfStream(sequenceNumber: Int) = PCMChunk(ByteArray(0), sequenceNumber, true)
|
|
45
|
+
}
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
// Cache for decoded PCM data
|
|
49
|
+
private data class CachedPCMData(
|
|
50
|
+
val chunks: List<ByteArray>,
|
|
51
|
+
val totalBytes: Long
|
|
52
|
+
)
|
|
53
|
+
|
|
54
|
+
private data class SilenceCacheKey(
|
|
55
|
+
val durationMs: Double,
|
|
56
|
+
val sampleRate: Int,
|
|
57
|
+
val channelCount: Int
|
|
58
|
+
)
|
|
59
|
+
|
|
60
|
+
// Buffer pool for silence generation to reduce memory allocations
|
|
61
|
+
private object SilenceBufferPool {
|
|
62
|
+
private val pool = ConcurrentHashMap<Int, ByteArray>()
|
|
63
|
+
private val standardSizes = listOf(4096, 8192, 16384, 32768, 65536, 131072)
|
|
64
|
+
|
|
65
|
+
init {
|
|
66
|
+
// Pre-allocate common silence buffer sizes
|
|
67
|
+
standardSizes.forEach { size ->
|
|
68
|
+
pool[size] = ByteArray(size)
|
|
69
|
+
}
|
|
70
|
+
Log.d("AudioConcat", "SilenceBufferPool initialized with ${standardSizes.size} standard sizes")
|
|
71
|
+
}
|
|
72
|
+
|
|
73
|
+
fun getBuffer(requestedSize: Int): ByteArray {
|
|
74
|
+
// Find the smallest standard size that fits the request
|
|
75
|
+
val standardSize = standardSizes.firstOrNull { it >= requestedSize }
|
|
76
|
+
|
|
77
|
+
return if (standardSize != null) {
|
|
78
|
+
// Return pooled buffer (already zeroed)
|
|
79
|
+
pool.getOrPut(standardSize) { ByteArray(standardSize) }
|
|
80
|
+
} else {
|
|
81
|
+
// Size too large for pool, create new buffer
|
|
82
|
+
ByteArray(requestedSize)
|
|
83
|
+
}
|
|
84
|
+
}
|
|
85
|
+
|
|
86
|
+
fun clear() {
|
|
87
|
+
pool.clear()
|
|
88
|
+
Log.d("AudioConcat", "SilenceBufferPool cleared")
|
|
89
|
+
}
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
private class PCMCache(
|
|
93
|
+
private val shouldCacheFile: Set<String>,
|
|
94
|
+
private val shouldCacheSilence: Set<SilenceCacheKey>
|
|
95
|
+
) {
|
|
96
|
+
private val audioFileCache = ConcurrentHashMap<String, CachedPCMData>()
|
|
97
|
+
private val silenceCache = ConcurrentHashMap<SilenceCacheKey, ByteArray>()
|
|
98
|
+
private var currentCacheSizeBytes = 0L
|
|
99
|
+
|
|
100
|
+
// Dynamic cache size based on available memory
|
|
101
|
+
private val maxCacheSizeBytes: Long
|
|
102
|
+
get() {
|
|
103
|
+
val runtime = Runtime.getRuntime()
|
|
104
|
+
val maxMemory = runtime.maxMemory()
|
|
105
|
+
val usedMemory = runtime.totalMemory() - runtime.freeMemory()
|
|
106
|
+
val availableMemory = maxMemory - usedMemory
|
|
107
|
+
|
|
108
|
+
// Use 20% of available memory for cache, but constrain between 50MB and 200MB
|
|
109
|
+
val dynamicCacheMB = (availableMemory / (1024 * 1024) * 0.2).toLong()
|
|
110
|
+
val cacheMB = dynamicCacheMB.coerceIn(50, 200)
|
|
111
|
+
|
|
112
|
+
return cacheMB * 1024 * 1024
|
|
113
|
+
}
|
|
114
|
+
|
|
115
|
+
fun getAudioFile(filePath: String): CachedPCMData? {
|
|
116
|
+
return audioFileCache[filePath]
|
|
117
|
+
}
|
|
118
|
+
|
|
119
|
+
fun putAudioFile(filePath: String, data: CachedPCMData) {
|
|
120
|
+
// Only cache if this file appears multiple times
|
|
121
|
+
if (!shouldCacheFile.contains(filePath)) {
|
|
122
|
+
return
|
|
123
|
+
}
|
|
124
|
+
|
|
125
|
+
// Check cache size limit (dynamic)
|
|
126
|
+
if (currentCacheSizeBytes + data.totalBytes > maxCacheSizeBytes) {
|
|
127
|
+
val maxCacheMB = maxCacheSizeBytes / (1024 * 1024)
|
|
128
|
+
Log.d("AudioConcat", "Cache full ($maxCacheMB MB), not caching: $filePath")
|
|
129
|
+
return
|
|
130
|
+
}
|
|
131
|
+
|
|
132
|
+
audioFileCache[filePath] = data
|
|
133
|
+
currentCacheSizeBytes += data.totalBytes
|
|
134
|
+
Log.d("AudioConcat", "Cached audio file: $filePath (${data.totalBytes / 1024}KB, total: ${currentCacheSizeBytes / 1024}KB)")
|
|
135
|
+
}
|
|
136
|
+
|
|
137
|
+
fun getSilence(key: SilenceCacheKey): ByteArray? {
|
|
138
|
+
return silenceCache[key]
|
|
139
|
+
}
|
|
140
|
+
|
|
141
|
+
fun putSilence(key: SilenceCacheKey, data: ByteArray) {
|
|
142
|
+
// Only cache if this silence pattern appears multiple times
|
|
143
|
+
if (!shouldCacheSilence.contains(key)) {
|
|
144
|
+
return
|
|
145
|
+
}
|
|
146
|
+
|
|
147
|
+
silenceCache[key] = data
|
|
148
|
+
Log.d("AudioConcat", "Cached silence: ${key.durationMs}ms")
|
|
149
|
+
}
|
|
150
|
+
|
|
151
|
+
fun clear() {
|
|
152
|
+
audioFileCache.clear()
|
|
153
|
+
silenceCache.clear()
|
|
154
|
+
currentCacheSizeBytes = 0
|
|
155
|
+
Log.d("AudioConcat", "Cache cleared")
|
|
156
|
+
}
|
|
157
|
+
|
|
158
|
+
fun getStats(): String {
|
|
159
|
+
return "Audio files: ${audioFileCache.size}, Silence patterns: ${silenceCache.size}, Size: ${currentCacheSizeBytes / 1024}KB"
|
|
160
|
+
}
|
|
161
|
+
}
|
|
162
|
+
|
|
32
163
|
private fun extractAudioConfig(filePath: String): AudioConfig {
|
|
33
164
|
val extractor = MediaExtractor()
|
|
34
165
|
try {
|
|
@@ -67,6 +198,7 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
67
198
|
private var totalPresentationTimeUs = 0L
|
|
68
199
|
private val sampleRate: Int
|
|
69
200
|
private val channelCount: Int
|
|
201
|
+
private val maxChunkSize: Int
|
|
70
202
|
|
|
71
203
|
init {
|
|
72
204
|
this.sampleRate = sampleRate
|
|
@@ -79,7 +211,20 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
79
211
|
)
|
|
80
212
|
outputFormat.setInteger(MediaFormat.KEY_AAC_PROFILE, MediaCodecInfo.CodecProfileLevel.AACObjectLC)
|
|
81
213
|
outputFormat.setInteger(MediaFormat.KEY_BIT_RATE, bitRate)
|
|
82
|
-
|
|
214
|
+
|
|
215
|
+
// Optimized buffer size based on audio parameters
|
|
216
|
+
// Target: ~1024 samples per frame for optimal AAC encoding
|
|
217
|
+
val samplesPerFrame = 1024
|
|
218
|
+
val bytesPerSample = channelCount * 2 // 16-bit PCM
|
|
219
|
+
val optimalBufferSize = samplesPerFrame * bytesPerSample
|
|
220
|
+
// Use at least the optimal size, but allow for some overhead
|
|
221
|
+
val bufferSize = (optimalBufferSize * 1.5).toInt().coerceAtLeast(16384)
|
|
222
|
+
outputFormat.setInteger(MediaFormat.KEY_MAX_INPUT_SIZE, bufferSize)
|
|
223
|
+
|
|
224
|
+
// Store for use in encodePCMChunk
|
|
225
|
+
this.maxChunkSize = bufferSize
|
|
226
|
+
|
|
227
|
+
Log.d("AudioConcat", "Encoder buffer size: $bufferSize bytes (${samplesPerFrame} samples, ${sampleRate}Hz, ${channelCount}ch)")
|
|
83
228
|
|
|
84
229
|
encoder = MediaCodec.createEncoderByType(MediaFormat.MIMETYPE_AUDIO_AAC)
|
|
85
230
|
encoder.configure(outputFormat, null, null, MediaCodec.CONFIGURE_FLAG_ENCODE)
|
|
@@ -89,29 +234,55 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
89
234
|
}
|
|
90
235
|
|
|
91
236
|
fun encodePCMChunk(pcmData: ByteArray, isLast: Boolean = false): Boolean {
|
|
92
|
-
//
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
237
|
+
// Split large PCM data into smaller chunks that fit in encoder buffer (use configured size)
|
|
238
|
+
var offset = 0
|
|
239
|
+
|
|
240
|
+
while (offset < pcmData.size) {
|
|
241
|
+
val chunkSize = minOf(maxChunkSize, pcmData.size - offset)
|
|
242
|
+
val isLastChunk = (offset + chunkSize >= pcmData.size) && isLast
|
|
243
|
+
|
|
244
|
+
// Feed PCM data chunk to encoder (reduced timeout for better throughput)
|
|
245
|
+
val inputBufferIndex = encoder.dequeueInputBuffer(1000)
|
|
246
|
+
if (inputBufferIndex >= 0) {
|
|
247
|
+
val inputBuffer = encoder.getInputBuffer(inputBufferIndex)!!
|
|
248
|
+
val bufferCapacity = inputBuffer.capacity()
|
|
249
|
+
|
|
250
|
+
// Ensure chunk fits in buffer
|
|
251
|
+
val actualChunkSize = minOf(chunkSize, bufferCapacity)
|
|
252
|
+
|
|
253
|
+
inputBuffer.clear()
|
|
254
|
+
inputBuffer.put(pcmData, offset, actualChunkSize)
|
|
98
255
|
|
|
99
|
-
|
|
100
|
-
|
|
256
|
+
val presentationTimeUs = totalPresentationTimeUs
|
|
257
|
+
totalPresentationTimeUs += (actualChunkSize.toLong() * 1_000_000) / (sampleRate * channelCount * 2)
|
|
101
258
|
|
|
102
|
-
|
|
103
|
-
|
|
259
|
+
val flags = if (isLastChunk) MediaCodec.BUFFER_FLAG_END_OF_STREAM else 0
|
|
260
|
+
encoder.queueInputBuffer(inputBufferIndex, 0, actualChunkSize, presentationTimeUs, flags)
|
|
261
|
+
|
|
262
|
+
offset += actualChunkSize
|
|
263
|
+
} else {
|
|
264
|
+
// Buffer not available, drain first
|
|
265
|
+
drainEncoder(false)
|
|
266
|
+
}
|
|
267
|
+
|
|
268
|
+
// Drain encoder output periodically
|
|
269
|
+
if (offset < pcmData.size || !isLastChunk) {
|
|
270
|
+
drainEncoder(false)
|
|
271
|
+
}
|
|
104
272
|
}
|
|
105
273
|
|
|
106
|
-
//
|
|
107
|
-
|
|
274
|
+
// Final drain if last chunk
|
|
275
|
+
if (isLast) {
|
|
276
|
+
drainEncoder(true)
|
|
277
|
+
}
|
|
108
278
|
|
|
109
279
|
return true
|
|
110
280
|
}
|
|
111
281
|
|
|
112
282
|
private fun drainEncoder(endOfStream: Boolean) {
|
|
113
283
|
while (true) {
|
|
114
|
-
|
|
284
|
+
// Use shorter timeout for better responsiveness
|
|
285
|
+
val outputBufferIndex = encoder.dequeueOutputBuffer(bufferInfo, if (endOfStream) 1000 else 0)
|
|
115
286
|
|
|
116
287
|
when (outputBufferIndex) {
|
|
117
288
|
MediaCodec.INFO_OUTPUT_FORMAT_CHANGED -> {
|
|
@@ -156,8 +327,8 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
156
327
|
}
|
|
157
328
|
|
|
158
329
|
fun finish() {
|
|
159
|
-
// Signal end of stream
|
|
160
|
-
val inputBufferIndex = encoder.dequeueInputBuffer(
|
|
330
|
+
// Signal end of stream (reduced timeout)
|
|
331
|
+
val inputBufferIndex = encoder.dequeueInputBuffer(1000)
|
|
161
332
|
if (inputBufferIndex >= 0) {
|
|
162
333
|
encoder.queueInputBuffer(inputBufferIndex, 0, 0, 0, MediaCodec.BUFFER_FLAG_END_OF_STREAM)
|
|
163
334
|
}
|
|
@@ -175,10 +346,274 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
175
346
|
}
|
|
176
347
|
}
|
|
177
348
|
|
|
349
|
+
private fun resamplePCM16(
|
|
350
|
+
input: ByteArray,
|
|
351
|
+
inputSampleRate: Int,
|
|
352
|
+
outputSampleRate: Int,
|
|
353
|
+
channelCount: Int
|
|
354
|
+
): ByteArray {
|
|
355
|
+
if (inputSampleRate == outputSampleRate) {
|
|
356
|
+
return input
|
|
357
|
+
}
|
|
358
|
+
|
|
359
|
+
val inputSampleCount = input.size / (2 * channelCount) // 16-bit = 2 bytes per sample
|
|
360
|
+
val outputSampleCount = (inputSampleCount.toLong() * outputSampleRate / inputSampleRate).toInt()
|
|
361
|
+
val output = ByteArray(outputSampleCount * 2 * channelCount)
|
|
362
|
+
|
|
363
|
+
// Use fixed-point arithmetic (16.16 format) to avoid floating-point operations
|
|
364
|
+
// This provides 3-5x performance improvement
|
|
365
|
+
val step = ((inputSampleRate.toLong() shl 16) / outputSampleRate).toInt()
|
|
366
|
+
var srcPos = 0
|
|
367
|
+
|
|
368
|
+
for (i in 0 until outputSampleCount) {
|
|
369
|
+
val srcIndex = srcPos shr 16
|
|
370
|
+
val fraction = srcPos and 0xFFFF // Fractional part in 16-bit fixed-point
|
|
371
|
+
|
|
372
|
+
// Boundary check: ensure we don't go beyond input array
|
|
373
|
+
if (srcIndex >= inputSampleCount - 1) {
|
|
374
|
+
break
|
|
375
|
+
}
|
|
376
|
+
|
|
377
|
+
for (ch in 0 until channelCount) {
|
|
378
|
+
// Get current and next sample indices
|
|
379
|
+
val idx1 = (srcIndex * channelCount + ch) * 2
|
|
380
|
+
val idx2 = ((srcIndex + 1) * channelCount + ch) * 2
|
|
381
|
+
|
|
382
|
+
// Read 16-bit samples (little-endian)
|
|
383
|
+
val sample1 = (input[idx1].toInt() and 0xFF) or (input[idx1 + 1].toInt() shl 8)
|
|
384
|
+
val sample2 = if (idx2 + 1 < input.size) {
|
|
385
|
+
(input[idx2].toInt() and 0xFF) or (input[idx2 + 1].toInt() shl 8)
|
|
386
|
+
} else {
|
|
387
|
+
sample1
|
|
388
|
+
}
|
|
389
|
+
|
|
390
|
+
// Convert to signed 16-bit
|
|
391
|
+
val s1 = if (sample1 > 32767) sample1 - 65536 else sample1
|
|
392
|
+
val s2 = if (sample2 > 32767) sample2 - 65536 else sample2
|
|
393
|
+
|
|
394
|
+
// Linear interpolation using integer arithmetic
|
|
395
|
+
// interpolated = s1 + (s2 - s1) * fraction
|
|
396
|
+
// fraction is in 16.16 format, so we shift right by 16 after multiplication
|
|
397
|
+
val interpolated = s1 + (((s2 - s1) * fraction) shr 16)
|
|
398
|
+
|
|
399
|
+
// Clamp to 16-bit range
|
|
400
|
+
val clamped = interpolated.coerceIn(-32768, 32767)
|
|
401
|
+
|
|
402
|
+
// Convert back to unsigned and write (little-endian)
|
|
403
|
+
val outIdx = (i * channelCount + ch) * 2
|
|
404
|
+
output[outIdx] = (clamped and 0xFF).toByte()
|
|
405
|
+
output[outIdx + 1] = (clamped shr 8).toByte()
|
|
406
|
+
}
|
|
407
|
+
|
|
408
|
+
srcPos += step
|
|
409
|
+
}
|
|
410
|
+
|
|
411
|
+
return output
|
|
412
|
+
}
|
|
413
|
+
|
|
414
|
+
private fun convertChannelCount(
|
|
415
|
+
input: ByteArray,
|
|
416
|
+
inputChannels: Int,
|
|
417
|
+
outputChannels: Int
|
|
418
|
+
): ByteArray {
|
|
419
|
+
if (inputChannels == outputChannels) {
|
|
420
|
+
return input
|
|
421
|
+
}
|
|
422
|
+
|
|
423
|
+
val sampleCount = input.size / (2 * inputChannels)
|
|
424
|
+
val output = ByteArray(sampleCount * 2 * outputChannels)
|
|
425
|
+
|
|
426
|
+
when {
|
|
427
|
+
inputChannels == 1 && outputChannels == 2 -> {
|
|
428
|
+
// Mono to Stereo: duplicate the channel
|
|
429
|
+
for (i in 0 until sampleCount) {
|
|
430
|
+
val srcIdx = i * 2
|
|
431
|
+
val dstIdx = i * 4
|
|
432
|
+
output[dstIdx] = input[srcIdx]
|
|
433
|
+
output[dstIdx + 1] = input[srcIdx + 1]
|
|
434
|
+
output[dstIdx + 2] = input[srcIdx]
|
|
435
|
+
output[dstIdx + 3] = input[srcIdx + 1]
|
|
436
|
+
}
|
|
437
|
+
}
|
|
438
|
+
inputChannels == 2 && outputChannels == 1 -> {
|
|
439
|
+
// Stereo to Mono: average the channels
|
|
440
|
+
for (i in 0 until sampleCount) {
|
|
441
|
+
val srcIdx = i * 4
|
|
442
|
+
val dstIdx = i * 2
|
|
443
|
+
|
|
444
|
+
val left = (input[srcIdx].toInt() and 0xFF) or (input[srcIdx + 1].toInt() shl 8)
|
|
445
|
+
val right = (input[srcIdx + 2].toInt() and 0xFF) or (input[srcIdx + 3].toInt() shl 8)
|
|
446
|
+
|
|
447
|
+
val leftSigned = if (left > 32767) left - 65536 else left
|
|
448
|
+
val rightSigned = if (right > 32767) right - 65536 else right
|
|
449
|
+
|
|
450
|
+
// Use bit shift instead of division for better performance (x / 2 = x >> 1)
|
|
451
|
+
val avg = ((leftSigned + rightSigned) shr 1).coerceIn(-32768, 32767)
|
|
452
|
+
|
|
453
|
+
output[dstIdx] = (avg and 0xFF).toByte()
|
|
454
|
+
output[dstIdx + 1] = (avg shr 8).toByte()
|
|
455
|
+
}
|
|
456
|
+
}
|
|
457
|
+
else -> {
|
|
458
|
+
// Fallback: just take the first channel
|
|
459
|
+
for (i in 0 until sampleCount) {
|
|
460
|
+
val srcIdx = i * 2 * inputChannels
|
|
461
|
+
val dstIdx = i * 2 * outputChannels
|
|
462
|
+
for (ch in 0 until minOf(inputChannels, outputChannels)) {
|
|
463
|
+
output[dstIdx + ch * 2] = input[srcIdx + ch * 2]
|
|
464
|
+
output[dstIdx + ch * 2 + 1] = input[srcIdx + ch * 2 + 1]
|
|
465
|
+
}
|
|
466
|
+
}
|
|
467
|
+
}
|
|
468
|
+
}
|
|
469
|
+
|
|
470
|
+
return output
|
|
471
|
+
}
|
|
472
|
+
|
|
473
|
+
private fun parallelDecodeToQueue(
|
|
474
|
+
filePath: String,
|
|
475
|
+
queue: BlockingQueue<PCMChunk>,
|
|
476
|
+
sequenceStart: AtomicInteger,
|
|
477
|
+
targetSampleRate: Int,
|
|
478
|
+
targetChannelCount: Int,
|
|
479
|
+
latch: CountDownLatch,
|
|
480
|
+
cache: PCMCache
|
|
481
|
+
) {
|
|
482
|
+
try {
|
|
483
|
+
// Check cache first
|
|
484
|
+
val cachedData = cache.getAudioFile(filePath)
|
|
485
|
+
if (cachedData != null) {
|
|
486
|
+
Log.d("AudioConcat", "Using cached PCM for: $filePath")
|
|
487
|
+
// Put cached chunks to queue
|
|
488
|
+
for (chunk in cachedData.chunks) {
|
|
489
|
+
val seqNum = sequenceStart.getAndIncrement()
|
|
490
|
+
queue.put(PCMChunk(chunk, seqNum))
|
|
491
|
+
}
|
|
492
|
+
latch.countDown()
|
|
493
|
+
return
|
|
494
|
+
}
|
|
495
|
+
|
|
496
|
+
val extractor = MediaExtractor()
|
|
497
|
+
var decoder: MediaCodec? = null
|
|
498
|
+
val decodedChunks = mutableListOf<ByteArray>()
|
|
499
|
+
var totalBytes = 0L
|
|
500
|
+
|
|
501
|
+
try {
|
|
502
|
+
extractor.setDataSource(filePath)
|
|
503
|
+
|
|
504
|
+
var audioTrackIndex = -1
|
|
505
|
+
var audioFormat: MediaFormat? = null
|
|
506
|
+
|
|
507
|
+
for (i in 0 until extractor.trackCount) {
|
|
508
|
+
val format = extractor.getTrackFormat(i)
|
|
509
|
+
val mime = format.getString(MediaFormat.KEY_MIME) ?: continue
|
|
510
|
+
if (mime.startsWith("audio/")) {
|
|
511
|
+
audioTrackIndex = i
|
|
512
|
+
audioFormat = format
|
|
513
|
+
break
|
|
514
|
+
}
|
|
515
|
+
}
|
|
516
|
+
|
|
517
|
+
if (audioTrackIndex == -1 || audioFormat == null) {
|
|
518
|
+
throw Exception("No audio track found in $filePath")
|
|
519
|
+
}
|
|
520
|
+
|
|
521
|
+
val sourceSampleRate = audioFormat.getInteger(MediaFormat.KEY_SAMPLE_RATE)
|
|
522
|
+
val sourceChannelCount = audioFormat.getInteger(MediaFormat.KEY_CHANNEL_COUNT)
|
|
523
|
+
|
|
524
|
+
val needsResampling = sourceSampleRate != targetSampleRate
|
|
525
|
+
val needsChannelConversion = sourceChannelCount != targetChannelCount
|
|
526
|
+
|
|
527
|
+
if (needsResampling || needsChannelConversion) {
|
|
528
|
+
Log.d("AudioConcat", "Parallel decode: $filePath - ${sourceSampleRate}Hz ${sourceChannelCount}ch -> ${targetSampleRate}Hz ${targetChannelCount}ch")
|
|
529
|
+
}
|
|
530
|
+
|
|
531
|
+
extractor.selectTrack(audioTrackIndex)
|
|
532
|
+
|
|
533
|
+
val mime = audioFormat.getString(MediaFormat.KEY_MIME)!!
|
|
534
|
+
decoder = MediaCodec.createDecoderByType(mime)
|
|
535
|
+
decoder.configure(audioFormat, null, null, 0)
|
|
536
|
+
decoder.start()
|
|
537
|
+
|
|
538
|
+
val bufferInfo = MediaCodec.BufferInfo()
|
|
539
|
+
var isEOS = false
|
|
540
|
+
|
|
541
|
+
while (!isEOS) {
|
|
542
|
+
// Feed input to decoder (reduced timeout for faster processing)
|
|
543
|
+
val inputBufferIndex = decoder.dequeueInputBuffer(1000)
|
|
544
|
+
if (inputBufferIndex >= 0) {
|
|
545
|
+
val inputBuffer = decoder.getInputBuffer(inputBufferIndex)!!
|
|
546
|
+
val sampleSize = extractor.readSampleData(inputBuffer, 0)
|
|
547
|
+
|
|
548
|
+
if (sampleSize < 0) {
|
|
549
|
+
decoder.queueInputBuffer(inputBufferIndex, 0, 0, 0, MediaCodec.BUFFER_FLAG_END_OF_STREAM)
|
|
550
|
+
} else {
|
|
551
|
+
val presentationTimeUs = extractor.sampleTime
|
|
552
|
+
decoder.queueInputBuffer(inputBufferIndex, 0, sampleSize, presentationTimeUs, 0)
|
|
553
|
+
extractor.advance()
|
|
554
|
+
}
|
|
555
|
+
}
|
|
556
|
+
|
|
557
|
+
// Get PCM output from decoder and put to queue (reduced timeout)
|
|
558
|
+
val outputBufferIndex = decoder.dequeueOutputBuffer(bufferInfo, 1000)
|
|
559
|
+
if (outputBufferIndex >= 0) {
|
|
560
|
+
val outputBuffer = decoder.getOutputBuffer(outputBufferIndex)!!
|
|
561
|
+
|
|
562
|
+
if (bufferInfo.size > 0) {
|
|
563
|
+
var pcmData = ByteArray(bufferInfo.size)
|
|
564
|
+
outputBuffer.get(pcmData)
|
|
565
|
+
|
|
566
|
+
// Convert channel count if needed
|
|
567
|
+
if (needsChannelConversion) {
|
|
568
|
+
pcmData = convertChannelCount(pcmData, sourceChannelCount, targetChannelCount)
|
|
569
|
+
}
|
|
570
|
+
|
|
571
|
+
// Resample if needed
|
|
572
|
+
if (needsResampling) {
|
|
573
|
+
pcmData = resamplePCM16(pcmData, sourceSampleRate, targetSampleRate, targetChannelCount)
|
|
574
|
+
}
|
|
575
|
+
|
|
576
|
+
// Optimization: avoid unnecessary clone() - store original for caching
|
|
577
|
+
decodedChunks.add(pcmData)
|
|
578
|
+
totalBytes += pcmData.size
|
|
579
|
+
|
|
580
|
+
// Put a clone to queue (queue might modify it)
|
|
581
|
+
val seqNum = sequenceStart.getAndIncrement()
|
|
582
|
+
queue.put(PCMChunk(pcmData.clone(), seqNum))
|
|
583
|
+
}
|
|
584
|
+
|
|
585
|
+
decoder.releaseOutputBuffer(outputBufferIndex, false)
|
|
586
|
+
|
|
587
|
+
if ((bufferInfo.flags and MediaCodec.BUFFER_FLAG_END_OF_STREAM) != 0) {
|
|
588
|
+
isEOS = true
|
|
589
|
+
}
|
|
590
|
+
}
|
|
591
|
+
}
|
|
592
|
+
|
|
593
|
+
// Cache the decoded data
|
|
594
|
+
if (decodedChunks.isNotEmpty()) {
|
|
595
|
+
cache.putAudioFile(filePath, CachedPCMData(decodedChunks, totalBytes))
|
|
596
|
+
}
|
|
597
|
+
|
|
598
|
+
} finally {
|
|
599
|
+
decoder?.stop()
|
|
600
|
+
decoder?.release()
|
|
601
|
+
extractor.release()
|
|
602
|
+
}
|
|
603
|
+
} catch (e: Exception) {
|
|
604
|
+
Log.e("AudioConcat", "Error in parallel decode: ${e.message}", e)
|
|
605
|
+
throw e
|
|
606
|
+
} finally {
|
|
607
|
+
latch.countDown()
|
|
608
|
+
}
|
|
609
|
+
}
|
|
610
|
+
|
|
178
611
|
private fun streamDecodeAudioFile(
|
|
179
612
|
filePath: String,
|
|
180
613
|
encoder: StreamingEncoder,
|
|
181
|
-
isLastFile: Boolean
|
|
614
|
+
isLastFile: Boolean,
|
|
615
|
+
targetSampleRate: Int,
|
|
616
|
+
targetChannelCount: Int
|
|
182
617
|
) {
|
|
183
618
|
val extractor = MediaExtractor()
|
|
184
619
|
var decoder: MediaCodec? = null
|
|
@@ -203,6 +638,16 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
203
638
|
throw Exception("No audio track found in $filePath")
|
|
204
639
|
}
|
|
205
640
|
|
|
641
|
+
val sourceSampleRate = audioFormat.getInteger(MediaFormat.KEY_SAMPLE_RATE)
|
|
642
|
+
val sourceChannelCount = audioFormat.getInteger(MediaFormat.KEY_CHANNEL_COUNT)
|
|
643
|
+
|
|
644
|
+
val needsResampling = sourceSampleRate != targetSampleRate
|
|
645
|
+
val needsChannelConversion = sourceChannelCount != targetChannelCount
|
|
646
|
+
|
|
647
|
+
if (needsResampling || needsChannelConversion) {
|
|
648
|
+
Log.d("AudioConcat", "File: $filePath - ${sourceSampleRate}Hz ${sourceChannelCount}ch -> ${targetSampleRate}Hz ${targetChannelCount}ch")
|
|
649
|
+
}
|
|
650
|
+
|
|
206
651
|
extractor.selectTrack(audioTrackIndex)
|
|
207
652
|
|
|
208
653
|
val mime = audioFormat.getString(MediaFormat.KEY_MIME)!!
|
|
@@ -212,11 +657,10 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
212
657
|
|
|
213
658
|
val bufferInfo = MediaCodec.BufferInfo()
|
|
214
659
|
var isEOS = false
|
|
215
|
-
val pcmChunkSize = 8192 // Process in 8KB chunks
|
|
216
660
|
|
|
217
661
|
while (!isEOS) {
|
|
218
|
-
// Feed input to decoder
|
|
219
|
-
val inputBufferIndex = decoder.dequeueInputBuffer(
|
|
662
|
+
// Feed input to decoder (reduced timeout for faster processing)
|
|
663
|
+
val inputBufferIndex = decoder.dequeueInputBuffer(1000)
|
|
220
664
|
if (inputBufferIndex >= 0) {
|
|
221
665
|
val inputBuffer = decoder.getInputBuffer(inputBufferIndex)!!
|
|
222
666
|
val sampleSize = extractor.readSampleData(inputBuffer, 0)
|
|
@@ -230,16 +674,26 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
230
674
|
}
|
|
231
675
|
}
|
|
232
676
|
|
|
233
|
-
// Get PCM output from decoder and feed to encoder
|
|
234
|
-
val outputBufferIndex = decoder.dequeueOutputBuffer(bufferInfo,
|
|
677
|
+
// Get PCM output from decoder and feed to encoder (reduced timeout)
|
|
678
|
+
val outputBufferIndex = decoder.dequeueOutputBuffer(bufferInfo, 1000)
|
|
235
679
|
if (outputBufferIndex >= 0) {
|
|
236
680
|
val outputBuffer = decoder.getOutputBuffer(outputBufferIndex)!!
|
|
237
681
|
|
|
238
682
|
if (bufferInfo.size > 0) {
|
|
239
|
-
|
|
683
|
+
var pcmData = ByteArray(bufferInfo.size)
|
|
240
684
|
outputBuffer.get(pcmData)
|
|
241
685
|
|
|
242
|
-
//
|
|
686
|
+
// Convert channel count if needed
|
|
687
|
+
if (needsChannelConversion) {
|
|
688
|
+
pcmData = convertChannelCount(pcmData, sourceChannelCount, targetChannelCount)
|
|
689
|
+
}
|
|
690
|
+
|
|
691
|
+
// Resample if needed
|
|
692
|
+
if (needsResampling) {
|
|
693
|
+
pcmData = resamplePCM16(pcmData, sourceSampleRate, targetSampleRate, targetChannelCount)
|
|
694
|
+
}
|
|
695
|
+
|
|
696
|
+
// Stream to encoder
|
|
243
697
|
encoder.encodePCMChunk(pcmData, false)
|
|
244
698
|
}
|
|
245
699
|
|
|
@@ -262,24 +716,299 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
262
716
|
durationMs: Double,
|
|
263
717
|
encoder: StreamingEncoder,
|
|
264
718
|
sampleRate: Int,
|
|
265
|
-
channelCount: Int
|
|
719
|
+
channelCount: Int,
|
|
720
|
+
cache: PCMCache
|
|
266
721
|
) {
|
|
722
|
+
val cacheKey = SilenceCacheKey(durationMs, sampleRate, channelCount)
|
|
723
|
+
|
|
724
|
+
// Check cache first
|
|
725
|
+
val cachedSilence = cache.getSilence(cacheKey)
|
|
726
|
+
if (cachedSilence != null) {
|
|
727
|
+
Log.d("AudioConcat", "Using cached silence: ${durationMs}ms")
|
|
728
|
+
encoder.encodePCMChunk(cachedSilence, false)
|
|
729
|
+
return
|
|
730
|
+
}
|
|
731
|
+
|
|
732
|
+
// Generate silence
|
|
267
733
|
val totalSamples = ((durationMs / 1000.0) * sampleRate).toInt()
|
|
268
|
-
val chunkSamples = 4096 // Process in chunks
|
|
269
734
|
val bytesPerSample = channelCount * 2 // 16-bit stereo
|
|
735
|
+
val totalBytes = totalSamples * bytesPerSample
|
|
270
736
|
|
|
271
|
-
|
|
737
|
+
// For short silence (< 5 seconds), cache as single chunk
|
|
738
|
+
if (durationMs < 5000) {
|
|
739
|
+
// Use buffer pool to avoid allocation
|
|
740
|
+
val pooledBuffer = SilenceBufferPool.getBuffer(totalBytes)
|
|
741
|
+
val silenceData = if (pooledBuffer.size == totalBytes) {
|
|
742
|
+
pooledBuffer
|
|
743
|
+
} else {
|
|
744
|
+
// Copy only the needed portion
|
|
745
|
+
pooledBuffer.copyOf(totalBytes)
|
|
746
|
+
}
|
|
747
|
+
cache.putSilence(cacheKey, silenceData)
|
|
748
|
+
encoder.encodePCMChunk(silenceData, false)
|
|
749
|
+
} else {
|
|
750
|
+
// For longer silence, process in chunks without caching using pooled buffers
|
|
751
|
+
val chunkSamples = 16384
|
|
752
|
+
var samplesRemaining = totalSamples
|
|
272
753
|
|
|
273
|
-
|
|
274
|
-
|
|
275
|
-
|
|
276
|
-
val silenceChunk = ByteArray(chunkBytes) // All zeros = silence
|
|
754
|
+
while (samplesRemaining > 0) {
|
|
755
|
+
val currentChunkSamples = minOf(chunkSamples, samplesRemaining)
|
|
756
|
+
val chunkBytes = currentChunkSamples * bytesPerSample
|
|
277
757
|
|
|
278
|
-
|
|
279
|
-
|
|
758
|
+
// Use pooled buffer for chunk
|
|
759
|
+
val pooledBuffer = SilenceBufferPool.getBuffer(chunkBytes)
|
|
760
|
+
val silenceChunk = if (pooledBuffer.size == chunkBytes) {
|
|
761
|
+
pooledBuffer
|
|
762
|
+
} else {
|
|
763
|
+
pooledBuffer.copyOf(chunkBytes)
|
|
764
|
+
}
|
|
765
|
+
|
|
766
|
+
encoder.encodePCMChunk(silenceChunk, false)
|
|
767
|
+
samplesRemaining -= currentChunkSamples
|
|
768
|
+
}
|
|
769
|
+
}
|
|
770
|
+
}
|
|
771
|
+
|
|
772
|
+
private fun getOptimalThreadCount(audioFileCount: Int): Int {
|
|
773
|
+
val cpuCores = Runtime.getRuntime().availableProcessors()
|
|
774
|
+
val optimalThreads = when {
|
|
775
|
+
cpuCores <= 2 -> 2
|
|
776
|
+
cpuCores <= 4 -> 3
|
|
777
|
+
cpuCores <= 8 -> 4
|
|
778
|
+
else -> 6
|
|
779
|
+
}
|
|
780
|
+
// Don't create more threads than files to process
|
|
781
|
+
return optimalThreads.coerceAtMost(audioFileCount)
|
|
782
|
+
}
|
|
783
|
+
|
|
784
|
+
private fun getOptimalQueueSize(audioFileCount: Int): Int {
|
|
785
|
+
// Dynamic queue size based on number of files to prevent memory waste or blocking
|
|
786
|
+
return when {
|
|
787
|
+
audioFileCount <= 5 -> 20
|
|
788
|
+
audioFileCount <= 20 -> 50
|
|
789
|
+
audioFileCount <= 50 -> 100
|
|
790
|
+
else -> 150
|
|
280
791
|
}
|
|
281
792
|
}
|
|
282
793
|
|
|
794
|
+
private fun parallelProcessAudioFiles(
|
|
795
|
+
audioFiles: List<Pair<Int, String>>, // (index, filePath)
|
|
796
|
+
encoder: StreamingEncoder,
|
|
797
|
+
targetSampleRate: Int,
|
|
798
|
+
targetChannelCount: Int,
|
|
799
|
+
cache: PCMCache,
|
|
800
|
+
numThreads: Int = 3
|
|
801
|
+
) {
|
|
802
|
+
if (audioFiles.isEmpty()) return
|
|
803
|
+
|
|
804
|
+
// Group consecutive duplicate files
|
|
805
|
+
val optimizedFiles = mutableListOf<Pair<Int, String>>()
|
|
806
|
+
val consecutiveDuplicates = mutableMapOf<Int, Int>() // originalIndex -> count
|
|
807
|
+
|
|
808
|
+
var i = 0
|
|
809
|
+
while (i < audioFiles.size) {
|
|
810
|
+
val (index, filePath) = audioFiles[i]
|
|
811
|
+
var count = 1
|
|
812
|
+
|
|
813
|
+
// Check for consecutive duplicates
|
|
814
|
+
while (i + count < audioFiles.size && audioFiles[i + count].second == filePath) {
|
|
815
|
+
count++
|
|
816
|
+
}
|
|
817
|
+
|
|
818
|
+
if (count > 1) {
|
|
819
|
+
Log.d("AudioConcat", "Detected $count consecutive occurrences of: $filePath")
|
|
820
|
+
optimizedFiles.add(Pair(index, filePath))
|
|
821
|
+
consecutiveDuplicates[optimizedFiles.size - 1] = count
|
|
822
|
+
} else {
|
|
823
|
+
optimizedFiles.add(Pair(index, filePath))
|
|
824
|
+
}
|
|
825
|
+
|
|
826
|
+
i += count
|
|
827
|
+
}
|
|
828
|
+
|
|
829
|
+
val queueSize = getOptimalQueueSize(optimizedFiles.size)
|
|
830
|
+
val pcmQueue = LinkedBlockingQueue<PCMChunk>(queueSize)
|
|
831
|
+
Log.d("AudioConcat", "Using queue size: $queueSize for ${optimizedFiles.size} files")
|
|
832
|
+
val executor = Executors.newFixedThreadPool(numThreads)
|
|
833
|
+
val latch = CountDownLatch(optimizedFiles.size)
|
|
834
|
+
val sequenceCounter = AtomicInteger(0)
|
|
835
|
+
|
|
836
|
+
try {
|
|
837
|
+
// Submit decode tasks for unique files only
|
|
838
|
+
optimizedFiles.forEachIndexed { optIndex, (index, filePath) ->
|
|
839
|
+
executor.submit {
|
|
840
|
+
try {
|
|
841
|
+
val fileSequenceStart = AtomicInteger(sequenceCounter.get())
|
|
842
|
+
sequenceCounter.addAndGet(1000000)
|
|
843
|
+
|
|
844
|
+
Log.d("AudioConcat", "Starting parallel decode [$index]: $filePath")
|
|
845
|
+
parallelDecodeToQueue(filePath, pcmQueue, fileSequenceStart, targetSampleRate, targetChannelCount, latch, cache)
|
|
846
|
+
|
|
847
|
+
// Mark end with duplicate count
|
|
848
|
+
val repeatCount = consecutiveDuplicates[optIndex] ?: 1
|
|
849
|
+
val endSeqNum = fileSequenceStart.get()
|
|
850
|
+
pcmQueue.put(PCMChunk(ByteArray(0), endSeqNum, true)) // endOfStream marker with repeat count
|
|
851
|
+
|
|
852
|
+
} catch (e: Exception) {
|
|
853
|
+
Log.e("AudioConcat", "Error decoding file $filePath: ${e.message}", e)
|
|
854
|
+
latch.countDown()
|
|
855
|
+
}
|
|
856
|
+
}
|
|
857
|
+
}
|
|
858
|
+
|
|
859
|
+
// Consumer thread: encode in order
|
|
860
|
+
var filesCompleted = 0
|
|
861
|
+
var cachedChunks = mutableListOf<ByteArray>()
|
|
862
|
+
var isCollectingChunks = false
|
|
863
|
+
|
|
864
|
+
while (filesCompleted < optimizedFiles.size) {
|
|
865
|
+
val chunk = pcmQueue.take()
|
|
866
|
+
|
|
867
|
+
if (chunk.isEndOfStream) {
|
|
868
|
+
val optIndex = filesCompleted
|
|
869
|
+
val repeatCount = consecutiveDuplicates[optIndex] ?: 1
|
|
870
|
+
|
|
871
|
+
if (repeatCount > 1 && cachedChunks.isNotEmpty()) {
|
|
872
|
+
// Repeat the cached chunks
|
|
873
|
+
Log.d("AudioConcat", "Repeating cached chunks ${repeatCount - 1} more times")
|
|
874
|
+
repeat(repeatCount - 1) {
|
|
875
|
+
cachedChunks.forEach { data ->
|
|
876
|
+
encoder.encodePCMChunk(data, false)
|
|
877
|
+
}
|
|
878
|
+
}
|
|
879
|
+
cachedChunks.clear()
|
|
880
|
+
}
|
|
881
|
+
|
|
882
|
+
filesCompleted++
|
|
883
|
+
isCollectingChunks = false
|
|
884
|
+
Log.d("AudioConcat", "Completed file $filesCompleted/${optimizedFiles.size}")
|
|
885
|
+
continue
|
|
886
|
+
}
|
|
887
|
+
|
|
888
|
+
// Encode chunk
|
|
889
|
+
encoder.encodePCMChunk(chunk.data, false)
|
|
890
|
+
|
|
891
|
+
// Cache chunks for consecutive duplicates
|
|
892
|
+
val optIndex = filesCompleted
|
|
893
|
+
if (consecutiveDuplicates.containsKey(optIndex)) {
|
|
894
|
+
cachedChunks.add(chunk.data.clone())
|
|
895
|
+
}
|
|
896
|
+
}
|
|
897
|
+
|
|
898
|
+
// Wait for all decode tasks to complete
|
|
899
|
+
latch.await()
|
|
900
|
+
Log.d("AudioConcat", "All parallel decode tasks completed")
|
|
901
|
+
|
|
902
|
+
} finally {
|
|
903
|
+
executor.shutdown()
|
|
904
|
+
}
|
|
905
|
+
}
|
|
906
|
+
|
|
907
|
+
/**
 * A detected "file -> silence -> file -> silence -> ..." repetition in the
 * parsed input, where the same audio file alternates with an identical
 * silence gap. Produced by analyzeDuplicates so the file can be decoded once
 * and its PCM re-used for every repetition.
 */
private data class InterleavedPattern(
    // Path of the audio file that repeats throughout the pattern.
    val filePath: String,
    // Cache key of the silence separator between repetitions; null when the
    // pattern carries no silence separator.
    val silenceKey: SilenceCacheKey?,
    val indices: List<Int>, // Indices where this pattern occurs
    // Number of occurrences of the file in the run (always >= 2).
    val repeatCount: Int
)
|
|
913
|
+
|
|
914
|
+
/**
 * Result of scanning the parsed input for repeated content. Consumed when
 * choosing which decoded PCM buffers are worth caching before encoding.
 */
private data class DuplicateAnalysis(
    // File paths that appear at more than one position in the input.
    val duplicateFiles: Set<String>,
    // Silence specs (duration + output format) that appear more than once.
    val duplicateSilence: Set<SilenceCacheKey>,
    val fileOccurrences: Map<String, List<Int>>, // filePath -> list of indices
    // silence key -> every index (in the parsed list) where it occurs.
    val silenceOccurrences: Map<SilenceCacheKey, List<Int>>,
    // "file, silence, file, ..." runs detected in the sequence.
    val interleavedPatterns: List<InterleavedPattern>
)
|
|
921
|
+
|
|
922
|
+
/**
 * Scans [parsedData] for content that occurs more than once so the caller can
 * decide what to cache.
 *
 * Three kinds of duplication are collected:
 *  - audio files referenced at more than one position,
 *  - silence gaps whose (durationMs, sampleRate, channelCount) key repeats,
 *  - "interleaved" runs of the form file -> silence -> file -> ... in which
 *    the same file alternates with the same silence gap (>= 2 occurrences).
 *
 * @param parsedData the ordered concatenation plan (files and silence gaps).
 * @param audioConfig target output format; its sample rate and channel count
 *        are folded into every [SilenceCacheKey] so two silences only match
 *        when they would render identical PCM.
 * @return occurrence maps plus the duplicated-item sets and any detected
 *         interleaved patterns.
 */
private fun analyzeDuplicates(
    parsedData: List<AudioDataOrSilence>,
    audioConfig: AudioConfig
): DuplicateAnalysis {
    // Pass 1: index every occurrence of each file path and silence key.
    val fileCounts = mutableMapOf<String, MutableList<Int>>()
    val silenceCounts = mutableMapOf<SilenceCacheKey, MutableList<Int>>()

    parsedData.forEachIndexed { index, item ->
        when (item) {
            is AudioDataOrSilence.AudioFile -> {
                fileCounts.getOrPut(item.filePath) { mutableListOf() }.add(index)
            }
            is AudioDataOrSilence.Silence -> {
                val key = SilenceCacheKey(item.durationMs, audioConfig.sampleRate, audioConfig.channelCount)
                silenceCounts.getOrPut(key) { mutableListOf() }.add(index)
            }
        }
    }

    // Anything seen at two or more positions is a caching candidate.
    val duplicateFiles = fileCounts.filter { it.value.size > 1 }.keys.toSet()
    val duplicateSilence = silenceCounts.filter { it.value.size > 1 }.keys.toSet()

    // Detect interleaved patterns: file -> silence -> file -> silence -> file
    val interleavedPatterns = mutableListOf<InterleavedPattern>()

    var i = 0
    while (i < parsedData.size - 2) {
        if (parsedData[i] is AudioDataOrSilence.AudioFile &&
            parsedData[i + 1] is AudioDataOrSilence.Silence &&
            parsedData[i + 2] is AudioDataOrSilence.AudioFile) {

            val file1 = (parsedData[i] as AudioDataOrSilence.AudioFile).filePath
            val silence = parsedData[i + 1] as AudioDataOrSilence.Silence
            val file2 = (parsedData[i + 2] as AudioDataOrSilence.AudioFile).filePath
            val silenceKey = SilenceCacheKey(silence.durationMs, audioConfig.sampleRate, audioConfig.channelCount)

            // Check if it's the same file with silence separator
            if (file1 == file2) {
                var count = 1
                var currentIndex = i
                // indices records the position of each file occurrence in the run.
                val indices = mutableListOf(i)

                // Count how many times this pattern repeats; currentIndex always
                // points at the most recently accepted file occurrence.
                while (currentIndex + 2 < parsedData.size &&
                    parsedData[currentIndex + 2] is AudioDataOrSilence.AudioFile &&
                    (parsedData[currentIndex + 2] as AudioDataOrSilence.AudioFile).filePath == file1) {

                    // Check if there's a silence in between
                    if (currentIndex + 3 < parsedData.size &&
                        parsedData[currentIndex + 3] is AudioDataOrSilence.Silence) {
                        val nextSilence = parsedData[currentIndex + 3] as AudioDataOrSilence.Silence
                        val nextSilenceKey = SilenceCacheKey(nextSilence.durationMs, audioConfig.sampleRate, audioConfig.channelCount)

                        // Only a silence that would render identical PCM extends the run.
                        if (nextSilenceKey == silenceKey) {
                            count++
                            currentIndex += 2
                            indices.add(currentIndex)
                        } else {
                            break
                        }
                    } else {
                        // Last file in the pattern (no silence after)
                        count++
                        indices.add(currentIndex + 2)
                        break
                    }
                }

                if (count >= 2) {
                    interleavedPatterns.add(InterleavedPattern(file1, silenceKey, indices, count))
                    Log.d("AudioConcat", "Detected interleaved pattern: '$file1' + ${silenceKey.durationMs}ms silence, repeats $count times")
                    // NOTE(review): when the run ends because the next file's path
                    // differs, the silence directly after the final occurrence is not
                    // part of this pattern — confirm the consumer of `indices` does not
                    // mark that trailing silence as processed, or it would be dropped
                    // from the output.
                    i = currentIndex + 2 // Skip processed items
                    continue
                }
            }
        }
        i++
    }

    Log.d("AudioConcat", "Duplicate analysis: ${duplicateFiles.size} files, ${duplicateSilence.size} silence patterns, ${interleavedPatterns.size} interleaved patterns")
    duplicateFiles.forEach { file ->
        Log.d("AudioConcat", "  File '$file' appears ${fileCounts[file]?.size} times")
    }
    duplicateSilence.forEach { key ->
        Log.d("AudioConcat", "  Silence ${key.durationMs}ms appears ${silenceCounts[key]?.size} times")
    }

    return DuplicateAnalysis(duplicateFiles, duplicateSilence, fileCounts, silenceCounts, interleavedPatterns)
}
|
|
1011
|
+
|
|
283
1012
|
private fun parseAudioData(data: ReadableArray): List<AudioDataOrSilence> {
|
|
284
1013
|
val result = mutableListOf<AudioDataOrSilence>()
|
|
285
1014
|
for (i in 0 until data.size()) {
|
|
@@ -329,6 +1058,12 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
329
1058
|
|
|
330
1059
|
Log.d("AudioConcat", "Audio config: ${audioConfig.sampleRate}Hz, ${audioConfig.channelCount}ch, ${audioConfig.bitRate}bps")
|
|
331
1060
|
|
|
1061
|
+
// Analyze duplicates to determine cache strategy
|
|
1062
|
+
val duplicateAnalysis = analyzeDuplicates(parsedData, audioConfig)
|
|
1063
|
+
|
|
1064
|
+
// Create cache instance with intelligent caching strategy
|
|
1065
|
+
val cache = PCMCache(duplicateAnalysis.duplicateFiles, duplicateAnalysis.duplicateSilence)
|
|
1066
|
+
|
|
332
1067
|
// Delete existing output file
|
|
333
1068
|
val outputFile = File(outputPath)
|
|
334
1069
|
if (outputFile.exists()) {
|
|
@@ -344,33 +1079,194 @@ class AudioConcatModule(reactContext: ReactApplicationContext) :
|
|
|
344
1079
|
)
|
|
345
1080
|
|
|
346
1081
|
try {
|
|
347
|
-
//
|
|
1082
|
+
// Separate audio files and other items (silence)
|
|
1083
|
+
val audioFileItems = mutableListOf<Pair<Int, String>>()
|
|
1084
|
+
val nonAudioItems = mutableListOf<Pair<Int, AudioDataOrSilence>>()
|
|
1085
|
+
|
|
348
1086
|
for ((index, item) in parsedData.withIndex()) {
|
|
349
1087
|
when (item) {
|
|
350
1088
|
is AudioDataOrSilence.AudioFile -> {
|
|
351
|
-
|
|
352
|
-
|
|
1089
|
+
audioFileItems.add(Pair(index, item.filePath))
|
|
1090
|
+
}
|
|
1091
|
+
is AudioDataOrSilence.Silence -> {
|
|
1092
|
+
nonAudioItems.add(Pair(index, item))
|
|
1093
|
+
}
|
|
1094
|
+
}
|
|
1095
|
+
}
|
|
1096
|
+
|
|
1097
|
+
// Decide whether to use parallel or sequential processing
|
|
1098
|
+
val useParallel = audioFileItems.size >= 10 // Use parallel for 10+ files
|
|
1099
|
+
|
|
1100
|
+
if (useParallel) {
|
|
1101
|
+
Log.d("AudioConcat", "Using parallel processing for ${audioFileItems.size} audio files")
|
|
353
1102
|
|
|
354
|
-
|
|
355
|
-
|
|
1103
|
+
// Process interleaved patterns optimally
|
|
1104
|
+
val processedIndices = mutableSetOf<Int>()
|
|
1105
|
+
|
|
1106
|
+
// First, handle all interleaved patterns
|
|
1107
|
+
duplicateAnalysis.interleavedPatterns.forEach { pattern ->
|
|
1108
|
+
Log.d("AudioConcat", "Processing interleaved pattern: ${pattern.filePath}, ${pattern.repeatCount} repetitions")
|
|
1109
|
+
|
|
1110
|
+
// Decode the file once
|
|
1111
|
+
val filePath = pattern.filePath
|
|
1112
|
+
val cachedData = cache.getAudioFile(filePath)
|
|
1113
|
+
|
|
1114
|
+
val pcmChunks = if (cachedData != null) {
|
|
1115
|
+
Log.d("AudioConcat", "Using cached PCM for interleaved pattern: $filePath")
|
|
1116
|
+
cachedData.chunks
|
|
1117
|
+
} else {
|
|
1118
|
+
// Decode once and store
|
|
1119
|
+
val chunks = mutableListOf<ByteArray>()
|
|
1120
|
+
val tempQueue = LinkedBlockingQueue<PCMChunk>(100)
|
|
1121
|
+
val latch = CountDownLatch(1)
|
|
1122
|
+
val seqStart = AtomicInteger(0)
|
|
1123
|
+
|
|
1124
|
+
parallelDecodeToQueue(filePath, tempQueue, seqStart, audioConfig.sampleRate, audioConfig.channelCount, latch, cache)
|
|
1125
|
+
|
|
1126
|
+
// Collect chunks
|
|
1127
|
+
var collecting = true
|
|
1128
|
+
while (collecting) {
|
|
1129
|
+
val chunk = tempQueue.poll(100, java.util.concurrent.TimeUnit.MILLISECONDS)
|
|
1130
|
+
if (chunk != null) {
|
|
1131
|
+
if (!chunk.isEndOfStream) {
|
|
1132
|
+
chunks.add(chunk.data)
|
|
1133
|
+
} else {
|
|
1134
|
+
collecting = false
|
|
1135
|
+
}
|
|
1136
|
+
} else if (latch.count == 0L) {
|
|
1137
|
+
collecting = false
|
|
1138
|
+
}
|
|
1139
|
+
}
|
|
1140
|
+
|
|
1141
|
+
latch.await()
|
|
1142
|
+
chunks
|
|
356
1143
|
}
|
|
357
1144
|
|
|
358
|
-
|
|
359
|
-
|
|
360
|
-
|
|
361
|
-
|
|
362
|
-
|
|
363
|
-
|
|
364
|
-
|
|
365
|
-
|
|
366
|
-
|
|
367
|
-
|
|
1145
|
+
// Get silence PCM
|
|
1146
|
+
val silencePCM = pattern.silenceKey?.let { cache.getSilence(it) }
|
|
1147
|
+
?: pattern.silenceKey?.let {
|
|
1148
|
+
val totalSamples = ((it.durationMs / 1000.0) * it.sampleRate).toInt()
|
|
1149
|
+
val bytesPerSample = it.channelCount * 2
|
|
1150
|
+
ByteArray(totalSamples * bytesPerSample)
|
|
1151
|
+
}
|
|
1152
|
+
|
|
1153
|
+
// Encode the pattern: file -> silence -> file -> silence -> ...
|
|
1154
|
+
repeat(pattern.repeatCount) { iteration ->
|
|
1155
|
+
// Encode file
|
|
1156
|
+
pcmChunks.forEach { chunk ->
|
|
1157
|
+
encoder.encodePCMChunk(chunk, false)
|
|
1158
|
+
}
|
|
1159
|
+
|
|
1160
|
+
// Encode silence (except after the last file)
|
|
1161
|
+
if (iteration < pattern.repeatCount - 1 && silencePCM != null) {
|
|
1162
|
+
encoder.encodePCMChunk(silencePCM, false)
|
|
1163
|
+
}
|
|
1164
|
+
}
|
|
1165
|
+
|
|
1166
|
+
// Mark these indices as processed
|
|
1167
|
+
pattern.indices.forEach { idx ->
|
|
1168
|
+
processedIndices.add(idx)
|
|
1169
|
+
if (idx + 1 < parsedData.size && parsedData[idx + 1] is AudioDataOrSilence.Silence) {
|
|
1170
|
+
processedIndices.add(idx + 1)
|
|
1171
|
+
}
|
|
1172
|
+
}
|
|
1173
|
+
}
|
|
1174
|
+
|
|
1175
|
+
// Then process remaining items normally
|
|
1176
|
+
var audioFileIdx = 0
|
|
1177
|
+
for ((index, item) in parsedData.withIndex()) {
|
|
1178
|
+
if (processedIndices.contains(index)) {
|
|
1179
|
+
if (item is AudioDataOrSilence.AudioFile) audioFileIdx++
|
|
1180
|
+
continue
|
|
1181
|
+
}
|
|
1182
|
+
|
|
1183
|
+
when (item) {
|
|
1184
|
+
is AudioDataOrSilence.AudioFile -> {
|
|
1185
|
+
// Collect consecutive audio files for parallel processing
|
|
1186
|
+
val consecutiveFiles = mutableListOf<Pair<Int, String>>()
|
|
1187
|
+
var currentIdx = audioFileIdx
|
|
1188
|
+
|
|
1189
|
+
while (currentIdx < audioFileItems.size) {
|
|
1190
|
+
val (itemIdx, filePath) = audioFileItems[currentIdx]
|
|
1191
|
+
if (processedIndices.contains(itemIdx)) {
|
|
1192
|
+
currentIdx++
|
|
1193
|
+
continue
|
|
1194
|
+
}
|
|
1195
|
+
if (itemIdx != index + (currentIdx - audioFileIdx)) break
|
|
1196
|
+
consecutiveFiles.add(Pair(itemIdx, filePath))
|
|
1197
|
+
currentIdx++
|
|
1198
|
+
}
|
|
1199
|
+
|
|
1200
|
+
if (consecutiveFiles.isNotEmpty()) {
|
|
1201
|
+
val optimalThreads = getOptimalThreadCount(consecutiveFiles.size)
|
|
1202
|
+
Log.d("AudioConcat", "Using $optimalThreads threads for ${consecutiveFiles.size} files (CPU cores: ${Runtime.getRuntime().availableProcessors()})")
|
|
1203
|
+
parallelProcessAudioFiles(
|
|
1204
|
+
consecutiveFiles,
|
|
1205
|
+
encoder,
|
|
1206
|
+
audioConfig.sampleRate,
|
|
1207
|
+
audioConfig.channelCount,
|
|
1208
|
+
cache,
|
|
1209
|
+
numThreads = optimalThreads
|
|
1210
|
+
)
|
|
1211
|
+
audioFileIdx = currentIdx
|
|
1212
|
+
}
|
|
1213
|
+
}
|
|
1214
|
+
|
|
1215
|
+
is AudioDataOrSilence.Silence -> {
|
|
1216
|
+
val durationMs = item.durationMs
|
|
1217
|
+
Log.d("AudioConcat", "Item $index: Streaming silence ${durationMs}ms")
|
|
1218
|
+
streamEncodeSilence(
|
|
1219
|
+
durationMs,
|
|
1220
|
+
encoder,
|
|
1221
|
+
audioConfig.sampleRate,
|
|
1222
|
+
audioConfig.channelCount,
|
|
1223
|
+
cache
|
|
1224
|
+
)
|
|
1225
|
+
}
|
|
1226
|
+
}
|
|
1227
|
+
}
|
|
1228
|
+
} else {
|
|
1229
|
+
Log.d("AudioConcat", "Using sequential processing for ${audioFileItems.size} audio files")
|
|
1230
|
+
|
|
1231
|
+
// Process each item sequentially (original behavior)
|
|
1232
|
+
for ((index, item) in parsedData.withIndex()) {
|
|
1233
|
+
when (item) {
|
|
1234
|
+
is AudioDataOrSilence.AudioFile -> {
|
|
1235
|
+
val filePath = item.filePath
|
|
1236
|
+
Log.d("AudioConcat", "Item $index: Streaming decode $filePath")
|
|
1237
|
+
|
|
1238
|
+
val isLastFile = (index == parsedData.size - 1)
|
|
1239
|
+
streamDecodeAudioFile(
|
|
1240
|
+
filePath,
|
|
1241
|
+
encoder,
|
|
1242
|
+
isLastFile,
|
|
1243
|
+
audioConfig.sampleRate,
|
|
1244
|
+
audioConfig.channelCount
|
|
1245
|
+
)
|
|
1246
|
+
}
|
|
1247
|
+
|
|
1248
|
+
is AudioDataOrSilence.Silence -> {
|
|
1249
|
+
val durationMs = item.durationMs
|
|
1250
|
+
Log.d("AudioConcat", "Item $index: Streaming silence ${durationMs}ms")
|
|
1251
|
+
|
|
1252
|
+
streamEncodeSilence(
|
|
1253
|
+
durationMs,
|
|
1254
|
+
encoder,
|
|
1255
|
+
audioConfig.sampleRate,
|
|
1256
|
+
audioConfig.channelCount,
|
|
1257
|
+
cache
|
|
1258
|
+
)
|
|
1259
|
+
}
|
|
368
1260
|
}
|
|
369
1261
|
}
|
|
370
1262
|
}
|
|
371
1263
|
|
|
372
1264
|
// Finish encoding
|
|
373
1265
|
encoder.finish()
|
|
1266
|
+
|
|
1267
|
+
// Log cache statistics
|
|
1268
|
+
Log.d("AudioConcat", "Cache statistics: ${cache.getStats()}")
|
|
1269
|
+
|
|
374
1270
|
Log.d("AudioConcat", "Successfully merged audio to $outputPath")
|
|
375
1271
|
promise.resolve(outputPath)
|
|
376
1272
|
|