npm - @siteed/expo-audio-stream - Versions diffs - 1.17.0 → 2.0.1 - Mend

@siteed/expo-audio-stream 1.17.0 → 2.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (74) hide show

package/CHANGELOG.md +26 -1
package/README.md +1 -1
package/android/src/main/java/net/siteed/audiostream/AudioAnalysisData.kt +68 -22
package/android/src/main/java/net/siteed/audiostream/AudioFormatUtils.kt +24 -0
package/android/src/main/java/net/siteed/audiostream/AudioProcessor.kt +836 -386
package/android/src/main/java/net/siteed/audiostream/AudioRecorderManager.kt +0 -2
package/android/src/main/java/net/siteed/audiostream/AudioRecordingService.kt +35 -29
package/android/src/main/java/net/siteed/audiostream/ExpoAudioStreamModule.kt +236 -96
package/android/src/main/java/net/siteed/audiostream/FFT.kt +55 -0
package/android/src/main/java/net/siteed/audiostream/Features.kt +49 -7
package/android/src/main/java/net/siteed/audiostream/RecordingConfig.kt +2 -4
package/build/AudioAnalysis/AudioAnalysis.types.d.ts +55 -47
package/build/AudioAnalysis/AudioAnalysis.types.d.ts.map +1 -1
package/build/AudioAnalysis/AudioAnalysis.types.js.map +1 -1
package/build/AudioAnalysis/extractAudioAnalysis.d.ts +60 -13
package/build/AudioAnalysis/extractAudioAnalysis.d.ts.map +1 -1
package/build/AudioAnalysis/extractAudioAnalysis.js +147 -162
package/build/AudioAnalysis/extractAudioAnalysis.js.map +1 -1
package/build/ExpoAudioStream.types.d.ts +47 -3
package/build/ExpoAudioStream.types.d.ts.map +1 -1
package/build/ExpoAudioStream.types.js.map +1 -1
package/build/ExpoAudioStream.web.d.ts.map +1 -1
package/build/ExpoAudioStream.web.js +0 -1
package/build/ExpoAudioStream.web.js.map +1 -1
package/build/ExpoAudioStreamModule.d.ts.map +1 -1
package/build/ExpoAudioStreamModule.js +216 -12
package/build/ExpoAudioStreamModule.js.map +1 -1
package/build/WebRecorder.web.d.ts +67 -13
package/build/WebRecorder.web.d.ts.map +1 -1
package/build/WebRecorder.web.js +177 -173
package/build/WebRecorder.web.js.map +1 -1
package/build/index.d.ts +3 -3
package/build/index.d.ts.map +1 -1
package/build/index.js +2 -2
package/build/index.js.map +1 -1
package/build/useAudioRecorder.d.ts.map +1 -1
package/build/useAudioRecorder.js +12 -8
package/build/useAudioRecorder.js.map +1 -1
package/build/utils/audioProcessing.d.ts +24 -0
package/build/utils/audioProcessing.d.ts.map +1 -0
package/build/utils/audioProcessing.js +133 -0
package/build/utils/audioProcessing.js.map +1 -0
package/build/workers/InlineFeaturesExtractor.web.d.ts +1 -1
package/build/workers/InlineFeaturesExtractor.web.d.ts.map +1 -1
package/build/workers/InlineFeaturesExtractor.web.js +694 -194
package/build/workers/InlineFeaturesExtractor.web.js.map +1 -1
package/build/workers/inlineAudioWebWorker.web.d.ts +1 -1
package/build/workers/inlineAudioWebWorker.web.d.ts.map +1 -1
package/build/workers/inlineAudioWebWorker.web.js +3 -2
package/build/workers/inlineAudioWebWorker.web.js.map +1 -1
package/ios/AudioAnalysisData.swift +51 -16
package/ios/AudioProcessingHelpers.swift +710 -26
package/ios/AudioProcessor.swift +334 -185
package/ios/AudioStreamManager.swift +2 -3
package/ios/DataPoint.swift +25 -12
package/ios/DecodingConfig.swift +47 -0
package/ios/ExpoAudioStreamModule.swift +187 -103
package/ios/FFT.swift +62 -0
package/ios/Features.swift +24 -3
package/ios/RecordingSettings.swift +7 -7
package/package.json +2 -1
package/plugin/build/index.js +6 -1
package/plugin/src/index.ts +9 -1
package/src/AudioAnalysis/AudioAnalysis.types.ts +68 -52
package/src/AudioAnalysis/extractAudioAnalysis.ts +223 -219
package/src/ExpoAudioStream.types.ts +53 -7
package/src/ExpoAudioStream.web.ts +0 -1
package/src/ExpoAudioStreamModule.ts +255 -10
package/src/WebRecorder.web.ts +231 -244
package/src/index.ts +5 -3
package/src/useAudioRecorder.tsx +14 -10
package/src/utils/audioProcessing.ts +205 -0
package/src/workers/InlineFeaturesExtractor.web.tsx +694 -194
package/src/workers/inlineAudioWebWorker.web.tsx +3 -2

package/CHANGELOG.md CHANGED Viewed

@@ -8,6 +8,29 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ## [Unreleased]
+## [2.0.1] - 2025-02-27
+### Changed
+- refactor: update background mode handling for audio stream plugin ([e7e98cc](https://github.com/deeeed/expo-audio-stream/commit/e7e98cc60b7965770dcf25e9ae74cb356e1e7097))
+- chore(expo-audio-stream): release @siteed/expo-audio-stream@2.0.0 ([356d3f4](https://github.com/deeeed/expo-audio-stream/commit/356d3f40ffb66806eeecb86d12bcbe5d60b7eea6))
+## [2.0.0] - 2025-02-27
+### Changed
+- feat(playground): Enhance Audio Playground with Improved UX and Sample Audio Loading (#148) ([09d2794](https://github.com/deeeed/expo-audio-stream/commit/09d27940dcffa60e662c828742f4577bca5327f9))
+- feat: Implement Enhanced Audio Transcription Workflow with Configurable Extraction and UI Updates (#147) ([c658c7e](https://github.com/deeeed/expo-audio-stream/commit/c658c7e8531dd731b01d9347bc7c744470a3b7b9))
+- fix: audio recording reliability improvements and web IndexedDB management (#146) ([d4fa245](https://github.com/deeeed/expo-audio-stream/commit/d4fa245c46d487fe50c6454165efc2e1032ec126))
+- feat(transcription): refactor and unify transcription services across platforms (#145) ([a94b905](https://github.com/deeeed/expo-audio-stream/commit/a94b90562fb2112f712f78c03ca6a5110d6b1401))
+- feat(audio): enhance checksum verification and audio segment analysis (#143) ([49b6587](https://github.com/deeeed/expo-audio-stream/commit/49b65877d1fd9922f25b4892261c4fedf02ba3c3))
+- feat(playground): implement cross-platform ONNX runtime with Silero VAD model (#142) ([4a94639](https://github.com/deeeed/expo-audio-stream/commit/4a9463995f1eadf6531a2b4d6d057e90da097920))
+- feat(audio-analysis): enhance audio analysis and visualization capabilities (#141) ([ecf8f5d](https://github.com/deeeed/expo-audio-stream/commit/ecf8f5daf967bf27afb827c8cf6bca7510ce7b4e))
+- android 15 (#140) ([5321a3c](https://github.com/deeeed/expo-audio-stream/commit/5321a3c805d22e6824fd11fee4290987d550bd06))
+- refactor(audio): consolidate audio analysis APIs and migrate to segment-based processing (#139) ([5d45da8](https://github.com/deeeed/expo-audio-stream/commit/5d45da871ee1849898405ee4bf8bf8d296aebc48))
+- feat: pcm player (#137) ([8db6f16](https://github.com/deeeed/expo-audio-stream/commit/8db6f16f13cbcf78fd4a8e412bb00689e47d5a72))
+- feat(audio-stream): add extractAudioData API ([faf8915](https://github.com/deeeed/expo-audio-stream/commit/faf8915df3b18ea54ca7e562f61749d7cadf8bb4))
+- feat(audio): improve audio trimming and waveform visualization (#136) ([ad5514b](https://github.com/deeeed/expo-audio-stream/commit/ad5514b412eedc7211cb200cc3747e8a83afbf88))
+- feat(audio): enhance audio player with preview, trimming and feature analysis (#135) ([3f7eb9c](https://github.com/deeeed/expo-audio-stream/commit/3f7eb9cde7b314505d8ed3e4704c7b1321da6b15))
+- feat: add web permission for microphone (#131) ([9a2ed7f](https://github.com/deeeed/expo-audio-stream/commit/9a2ed7f31ad41560d094a22d1248034cb2f5886d))
+- refactor(audio): simplify amplitude analysis and remove redundant configuration (#133) ([5d64aa2](https://github.com/deeeed/expo-audio-stream/commit/5d64aa22299836cc9cb925d3e91f3d9470f3e856))
+- feat: add full audio analysis with spectral features and time range controls (#132) ([5677dc3](https://github.com/deeeed/expo-audio-stream/commit/5677dc321f5a9ff4bea37fbbce3cb6ae3aad67f6))
+- chore(expo-audio-stream): release @siteed/expo-audio-stream@1.17.0 ([689aead](https://github.com/deeeed/expo-audio-stream/commit/689aeadedaa58050cd18e8ec1fa5ff1fcd93f0db))
 ## [1.17.0] - 2025-02-18
 ### Changed
 - feat(web): add audio interval analysis ([281b7e6](https://github.com/deeeed/expo-audio-stream/commit/281b7e6b1136afe0569450a9d1e3d5f01da7af28))
@@ -135,7 +158,9 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Feature: Audio features extraction during recording.
 - Feature: Consistent WAV PCM recording format across all platforms.
-[unreleased]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@1.17.0...HEAD
+[unreleased]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@2.0.1...HEAD
+[2.0.1]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@2.0.0...@siteed/expo-audio-stream@2.0.1
+[2.0.0]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@1.17.0...@siteed/expo-audio-stream@2.0.0
 [1.17.0]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@1.16.0...@siteed/expo-audio-stream@1.17.0
 [1.16.0]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@1.15.1...@siteed/expo-audio-stream@1.16.0
 [1.15.1]: https://github.com/deeeed/expo-audio-stream/compare/@siteed/expo-audio-stream@1.15.0...@siteed/expo-audio-stream@1.15.1

package/README.md CHANGED Viewed

@@ -48,7 +48,7 @@
 - Background audio recording on iOS.
 - Audio features extraction during recording.
 - Consistent WAV PCM recording format across all platforms.
-- Keep device awake during recording sessions
+- Keep recording active while app is in background
 - Rich notification system for recording status:
   - Android: Live waveform visualization in notifications
   - Android: Fully customizable notification appearance and actions

package/android/src/main/java/net/siteed/audiostream/AudioAnalysisData.kt CHANGED Viewed

@@ -4,34 +4,53 @@ package net.siteed.audiostream
 import android.os.Bundle
 import androidx.core.os.bundleOf
+data class SpeechFeatures(
+    val isActive: Boolean,
+    val speakerId: Int? = null
+) {
+    fun toDictionary(): Map<String, Any?> {
+        return mapOf(
+            "isActive" to isActive,
+            "speakerId" to speakerId
+        )
+    }
+    fun toBundle(): Bundle {
+        return bundleOf(
+            "isActive" to isActive,
+            "speakerId" to speakerId
+        )
+    }
+}
 data class DataPoint(
     val id: Long,
     val amplitude: Float,
-    val activeSpeech: Boolean? = null,
-    val dB: Float? = null,
-    val silent: Boolean? = null,
+    val rms: Float,
+    val dB: Float,
+    val silent: Boolean,
     val features: Features? = null,
+    val speech: SpeechFeatures? = null,
     val startTime: Float? = null,
     val endTime: Float? = null,
     val startPosition: Int? = null,
     val endPosition: Int? = null,
-    val samples: Int = 0,
-    val speaker: Int? = null
+    val samples: Int = 0
 ) {
     fun toDictionary(): Map<String, Any?> {
         return mapOf(
             "id" to id,
             "amplitude" to amplitude,
-            "activeSpeech" to activeSpeech,
+            "rms" to rms,
             "dB" to dB,
             "silent" to silent,
             "features" to features?.toDictionary(),
+            "speech" to speech?.toDictionary(),
             "startTime" to startTime,
             "endTime" to endTime,
             "startPosition" to startPosition,
             "endPosition" to endPosition,
-            "samples" to samples,
-            "speaker" to speaker
+            "samples" to samples
         )
     }
@@ -39,22 +58,22 @@ data class DataPoint(
         return bundleOf(
             "id" to id,
             "amplitude" to amplitude,
-            "activeSpeech" to activeSpeech,
+            "rms" to rms,
             "dB" to dB,
             "silent" to silent,
             "features" to features?.toBundle(),
+            "speech" to speech?.toBundle(),
             "startTime" to startTime,
             "endTime" to endTime,
             "startPosition" to startPosition,
             "endPosition" to endPosition,
-            "samples" to samples,
-            "speaker" to speaker
+            "samples" to samples
         )
     }
 }
 data class AudioAnalysisData(
-    val pointsPerSecond: Double,
+    val segmentDurationMs: Int,
     val durationMs: Int,
     val bitDepth: Int,
     val numberOfChannels: Int,
@@ -62,7 +81,8 @@ data class AudioAnalysisData(
     val samples: Int,
     val dataPoints: List<DataPoint>,
     val amplitudeRange: AmplitudeRange,
-    val speakerChanges: List<SpeakerChange>,
+    val rmsRange: AmplitudeRange,
+    val speechAnalysis: SpeechAnalysis? = null,
     val extractionTimeMs: Float
 ) {
     data class AmplitudeRange(val min: Float, val max: Float) {
@@ -75,19 +95,44 @@ data class AudioAnalysisData(
         }
     }
-    data class SpeakerChange(val timestamp: Float, val speaker: Int) {
+    data class SpeechAnalysis(
+        val speakerChanges: List<SpeakerChange>
+    ) {
         fun toDictionary(): Map<String, Any> {
-            return mapOf("timestamp" to timestamp, "speaker" to speaker)
+            return mapOf(
+                "speakerChanges" to speakerChanges.map { it.toDictionary() }
+            )
         }
         fun toBundle(): Bundle {
-            return bundleOf("timestamp" to timestamp, "speaker" to speaker)
+            return bundleOf(
+                "speakerChanges" to speakerChanges.map { it.toBundle() }.toTypedArray()
+            )
         }
     }
-    fun toDictionary(): Map<String, Any> {
+    data class SpeakerChange(
+        val timestamp: Long,
+        val speakerId: Int
+    ) {
+        fun toDictionary(): Map<String, Any> {
+            return mapOf(
+                "timestamp" to timestamp,
+                "speakerId" to speakerId
+            )
+        }
+        fun toBundle(): Bundle {
+            return bundleOf(
+                "timestamp" to timestamp,
+                "speakerId" to speakerId
+            )
+        }
+    }
+    fun toDictionary(): Map<String, Any?> {
         return mapOf(
-            "pointsPerSecond" to pointsPerSecond,
+            "segmentDurationMs" to segmentDurationMs,
             "durationMs" to durationMs,
             "bitDepth" to bitDepth,
             "numberOfChannels" to numberOfChannels,
@@ -95,17 +140,17 @@ data class AudioAnalysisData(
             "samples" to samples,
             "dataPoints" to dataPoints.map { it.toDictionary() },
             "amplitudeRange" to amplitudeRange.toDictionary(),
-            "speakerChanges" to speakerChanges.map { it.toDictionary() },
+            "rmsRange" to rmsRange.toDictionary(),
+            "speechAnalysis" to speechAnalysis?.toDictionary(),
             "extractionTimeMs" to extractionTimeMs
         )
     }
     fun toBundle(): Bundle {
         val dataPointsBundleArray = dataPoints.map { it.toBundle() }.toTypedArray()
-        val speakerChangesBundleArray = speakerChanges.map { it.toBundle() }.toTypedArray()
         return bundleOf(
-            "pointsPerSecond" to pointsPerSecond,
+            "segmentDurationMs" to segmentDurationMs,
             "durationMs" to durationMs,
             "bitDepth" to bitDepth,
             "numberOfChannels" to numberOfChannels,
@@ -113,7 +158,8 @@ data class AudioAnalysisData(
             "samples" to samples,
             "dataPoints" to dataPointsBundleArray,
             "amplitudeRange" to amplitudeRange.toBundle(),
-            "speakerChanges" to speakerChangesBundleArray,
+            "rmsRange" to rmsRange.toBundle(),
+            "speechAnalysis" to speechAnalysis?.toBundle(),
             "extractionTimeMs" to extractionTimeMs
         )
     }

package/android/src/main/java/net/siteed/audiostream/AudioFormatUtils.kt CHANGED Viewed

@@ -76,4 +76,28 @@ object AudioFormatUtils {
             else -> AudioFormat.ENCODING_PCM_16BIT // Default to 16-bit PCM
         }
     }
+    /**
+     * Converts audio data between different bit depths
+     * @param audioData The raw audio data
+     * @param sourceBitDepth The original bit depth
+     * @param targetBitDepth The desired bit depth
+     * @return The converted audio data
+     */
+    fun convertBitDepth(audioData: ByteArray, sourceBitDepth: Int, targetBitDepth: Int): ByteArray {
+        // First convert to float array for normalization
+        val floatArray = convertByteArrayToFloatArray(audioData, "pcm_${sourceBitDepth}bit")
+        // Convert back to bytes with new bit depth
+        return when (targetBitDepth) {
+            8 -> floatArray.map { ((it + 1.0f) * 127.5f).toInt().toByte() }.toByteArray()
+            16 -> ByteBuffer.allocate(floatArray.size * 2).order(ByteOrder.LITTLE_ENDIAN).apply {
+                floatArray.forEach { asShortBuffer().put((it * 32767f).toInt().toShort()) }
+            }.array()
+            32 -> ByteBuffer.allocate(floatArray.size * 4).order(ByteOrder.LITTLE_ENDIAN).apply {
+                floatArray.forEach { putFloat(it) }
+            }.array()
+            else -> throw IllegalArgumentException("Unsupported target bit depth: $targetBitDepth")
+        }
+    }
 }