@siteed/audio-studio 3.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +535 -0
- package/LICENSE +21 -0
- package/README.md +167 -0
- package/android/build.gradle +143 -0
- package/android/src/androidTest/assets/chorus.wav +0 -0
- package/android/src/androidTest/assets/jfk.wav +0 -0
- package/android/src/androidTest/assets/osr_us_000_0010_8k.wav +0 -0
- package/android/src/androidTest/assets/recorder_hello_world.wav +0 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/AudioProcessorInstrumentedTest.kt +197 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/AudioRecorderInstrumentedTest.kt +541 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/AudioRecorderPerformanceInstrumentedTest.kt +234 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/AudioFocusStrategyIntegrationTest.kt +332 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/BufferDurationIntegrationTest.kt +324 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/CompressedOnlyOutputTest.kt +253 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/DeviceDisconnectionFallbackTest.kt +218 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/EventEmissionIntervalTest.kt +120 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/M4aFormatTest.kt +345 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/OutputControlIntegrationTest.kt +340 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/PcmStreamingDurationTest.kt +252 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/README.md +95 -0
- package/android/src/androidTest/java/net/siteed/audiostudio/integration/run_integration_tests.sh +43 -0
- package/android/src/main/AndroidManifest.xml +30 -0
- package/android/src/main/CMakeLists.txt +29 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioAnalysisData.kt +188 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioDataEncoder.kt +9 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioDeviceManager.kt +1741 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioFeaturesNative.kt +26 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioFileHandler.kt +136 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioFormatUtils.kt +354 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioNotificationsManager.kt +439 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioProcessor.kt +2237 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioRecorderManager.kt +2163 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioRecordingService.kt +167 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioStudioModule.kt +1112 -0
- package/android/src/main/java/net/siteed/audiostudio/AudioTrimmer.kt +1099 -0
- package/android/src/main/java/net/siteed/audiostudio/Constants.kt +37 -0
- package/android/src/main/java/net/siteed/audiostudio/EventSender.kt +7 -0
- package/android/src/main/java/net/siteed/audiostudio/FFT.kt +100 -0
- package/android/src/main/java/net/siteed/audiostudio/Features.kt +98 -0
- package/android/src/main/java/net/siteed/audiostudio/LogUtils.kt +93 -0
- package/android/src/main/java/net/siteed/audiostudio/MelSpectrogramNative.kt +36 -0
- package/android/src/main/java/net/siteed/audiostudio/NotificationConfig.kt +72 -0
- package/android/src/main/java/net/siteed/audiostudio/PermissionUtils.kt +68 -0
- package/android/src/main/java/net/siteed/audiostudio/RecordingActionReceiver.kt +59 -0
- package/android/src/main/java/net/siteed/audiostudio/RecordingConfig.kt +259 -0
- package/android/src/main/java/net/siteed/audiostudio/WaveformConfig.kt +19 -0
- package/android/src/main/java/net/siteed/audiostudio/WaveformRenderer.kt +159 -0
- package/android/src/main/jni/AudioFeaturesJNI.cpp +152 -0
- package/android/src/main/jni/MelSpectrogramJNI.cpp +165 -0
- package/android/src/main/res/drawable/ic_default_action_icon.xml +16 -0
- package/android/src/main/res/drawable/ic_microphone.xml +13 -0
- package/android/src/main/res/drawable/ic_pause.xml +10 -0
- package/android/src/main/res/drawable/ic_play.xml +10 -0
- package/android/src/main/res/drawable/ic_stop.xml +10 -0
- package/android/src/main/res/layout/notification_recording.xml +37 -0
- package/android/src/test/java/net/siteed/audiostudio/AudioFileHandlerTest.kt +279 -0
- package/android/src/test/java/net/siteed/audiostudio/AudioFocusStrategyTest.kt +249 -0
- package/android/src/test/java/net/siteed/audiostudio/AudioFormatTest.kt +151 -0
- package/android/src/test/java/net/siteed/audiostudio/AudioFormatUtilsTest.kt +273 -0
- package/android/src/test/java/net/siteed/audiostudio/DeviceDisconnectionFallbackUnitTest.kt +140 -0
- package/android/src/test/resources/chorus.wav +0 -0
- package/android/src/test/resources/generate_test_audio.py +94 -0
- package/android/src/test/resources/jfk.wav +0 -0
- package/android/src/test/resources/osr_us_000_0010_8k.wav +0 -0
- package/android/src/test/resources/recorder_hello_world.wav +0 -0
- package/app.plugin.js +3 -0
- package/build/cjs/AudioAnalysis/AudioAnalysis.types.js +4 -0
- package/build/cjs/AudioAnalysis/AudioAnalysis.types.js.map +1 -0
- package/build/cjs/AudioAnalysis/audioFeaturesWasm.js +164 -0
- package/build/cjs/AudioAnalysis/audioFeaturesWasm.js.map +1 -0
- package/build/cjs/AudioAnalysis/extractAudioAnalysis.js +213 -0
- package/build/cjs/AudioAnalysis/extractAudioAnalysis.js.map +1 -0
- package/build/cjs/AudioAnalysis/extractAudioData.js +21 -0
- package/build/cjs/AudioAnalysis/extractAudioData.js.map +1 -0
- package/build/cjs/AudioAnalysis/extractMelSpectrogram.js +90 -0
- package/build/cjs/AudioAnalysis/extractMelSpectrogram.js.map +1 -0
- package/build/cjs/AudioAnalysis/extractPreview.js +28 -0
- package/build/cjs/AudioAnalysis/extractPreview.js.map +1 -0
- package/build/cjs/AudioAnalysis/extractWaveform.js +18 -0
- package/build/cjs/AudioAnalysis/extractWaveform.js.map +1 -0
- package/build/cjs/AudioAnalysis/melSpectrogramWasm.js +149 -0
- package/build/cjs/AudioAnalysis/melSpectrogramWasm.js.map +1 -0
- package/build/cjs/AudioDeviceManager.js +688 -0
- package/build/cjs/AudioDeviceManager.js.map +1 -0
- package/build/cjs/AudioRecorder.provider.js +78 -0
- package/build/cjs/AudioRecorder.provider.js.map +1 -0
- package/build/cjs/AudioStudio.native.js +8 -0
- package/build/cjs/AudioStudio.native.js.map +1 -0
- package/build/cjs/AudioStudio.types.js +11 -0
- package/build/cjs/AudioStudio.types.js.map +1 -0
- package/build/cjs/AudioStudio.web.js +708 -0
- package/build/cjs/AudioStudio.web.js.map +1 -0
- package/build/cjs/AudioStudioModule.js +718 -0
- package/build/cjs/AudioStudioModule.js.map +1 -0
- package/build/cjs/WebRecorder.web.js +865 -0
- package/build/cjs/WebRecorder.web.js.map +1 -0
- package/build/cjs/constants/platformLimitations.js +99 -0
- package/build/cjs/constants/platformLimitations.js.map +1 -0
- package/build/cjs/constants.js +20 -0
- package/build/cjs/constants.js.map +1 -0
- package/build/cjs/events.js +29 -0
- package/build/cjs/events.js.map +1 -0
- package/build/cjs/hooks/useAudioDevices.js +179 -0
- package/build/cjs/hooks/useAudioDevices.js.map +1 -0
- package/build/cjs/index.js +64 -0
- package/build/cjs/index.js.map +1 -0
- package/build/cjs/trimAudio.js +76 -0
- package/build/cjs/trimAudio.js.map +1 -0
- package/build/cjs/useAudioRecorder.js +535 -0
- package/build/cjs/useAudioRecorder.js.map +1 -0
- package/build/cjs/utils/BlobFix.js +502 -0
- package/build/cjs/utils/BlobFix.js.map +1 -0
- package/build/cjs/utils/audioProcessing.js +136 -0
- package/build/cjs/utils/audioProcessing.js.map +1 -0
- package/build/cjs/utils/cleanNativeOptions.js +22 -0
- package/build/cjs/utils/cleanNativeOptions.js.map +1 -0
- package/build/cjs/utils/concatenateBuffers.js +25 -0
- package/build/cjs/utils/concatenateBuffers.js.map +1 -0
- package/build/cjs/utils/convertPCMToFloat32.js +124 -0
- package/build/cjs/utils/convertPCMToFloat32.js.map +1 -0
- package/build/cjs/utils/crc32.js +52 -0
- package/build/cjs/utils/crc32.js.map +1 -0
- package/build/cjs/utils/encodingToBitDepth.js +17 -0
- package/build/cjs/utils/encodingToBitDepth.js.map +1 -0
- package/build/cjs/utils/getWavFileInfo.js +96 -0
- package/build/cjs/utils/getWavFileInfo.js.map +1 -0
- package/build/cjs/utils/writeWavHeader.js +88 -0
- package/build/cjs/utils/writeWavHeader.js.map +1 -0
- package/build/cjs/workers/InlineFeaturesExtractor.web.js +294 -0
- package/build/cjs/workers/InlineFeaturesExtractor.web.js.map +1 -0
- package/build/cjs/workers/inlineAudioWebWorker.web.js +190 -0
- package/build/cjs/workers/inlineAudioWebWorker.web.js.map +1 -0
- package/build/cjs/workers/wasmGlueString.web.js +27 -0
- package/build/cjs/workers/wasmGlueString.web.js.map +1 -0
- package/build/esm/AudioAnalysis/AudioAnalysis.types.js +3 -0
- package/build/esm/AudioAnalysis/AudioAnalysis.types.js.map +1 -0
- package/build/esm/AudioAnalysis/audioFeaturesWasm.js +126 -0
- package/build/esm/AudioAnalysis/audioFeaturesWasm.js.map +1 -0
- package/build/esm/AudioAnalysis/extractAudioAnalysis.js +205 -0
- package/build/esm/AudioAnalysis/extractAudioAnalysis.js.map +1 -0
- package/build/esm/AudioAnalysis/extractAudioData.js +14 -0
- package/build/esm/AudioAnalysis/extractAudioData.js.map +1 -0
- package/build/esm/AudioAnalysis/extractMelSpectrogram.js +86 -0
- package/build/esm/AudioAnalysis/extractMelSpectrogram.js.map +1 -0
- package/build/esm/AudioAnalysis/extractPreview.js +25 -0
- package/build/esm/AudioAnalysis/extractPreview.js.map +1 -0
- package/build/esm/AudioAnalysis/extractWaveform.js +11 -0
- package/build/esm/AudioAnalysis/extractWaveform.js.map +1 -0
- package/build/esm/AudioAnalysis/melSpectrogramWasm.js +111 -0
- package/build/esm/AudioAnalysis/melSpectrogramWasm.js.map +1 -0
- package/build/esm/AudioDeviceManager.js +681 -0
- package/build/esm/AudioDeviceManager.js.map +1 -0
- package/build/esm/AudioRecorder.provider.js +40 -0
- package/build/esm/AudioRecorder.provider.js.map +1 -0
- package/build/esm/AudioStudio.native.js +6 -0
- package/build/esm/AudioStudio.native.js.map +1 -0
- package/build/esm/AudioStudio.types.js +8 -0
- package/build/esm/AudioStudio.types.js.map +1 -0
- package/build/esm/AudioStudio.web.js +704 -0
- package/build/esm/AudioStudio.web.js.map +1 -0
- package/build/esm/AudioStudioModule.js +713 -0
- package/build/esm/AudioStudioModule.js.map +1 -0
- package/build/esm/WebRecorder.web.js +861 -0
- package/build/esm/WebRecorder.web.js.map +1 -0
- package/build/esm/constants/platformLimitations.js +90 -0
- package/build/esm/constants/platformLimitations.js.map +1 -0
- package/build/esm/constants.js +17 -0
- package/build/esm/constants.js.map +1 -0
- package/build/esm/events.js +21 -0
- package/build/esm/events.js.map +1 -0
- package/build/esm/hooks/useAudioDevices.js +176 -0
- package/build/esm/hooks/useAudioDevices.js.map +1 -0
- package/build/esm/index.js +23 -0
- package/build/esm/index.js.map +1 -0
- package/build/esm/trimAudio.js +69 -0
- package/build/esm/trimAudio.js.map +1 -0
- package/build/esm/useAudioRecorder.js +529 -0
- package/build/esm/useAudioRecorder.js.map +1 -0
- package/build/esm/utils/BlobFix.js +498 -0
- package/build/esm/utils/BlobFix.js.map +1 -0
- package/build/esm/utils/audioProcessing.js +133 -0
- package/build/esm/utils/audioProcessing.js.map +1 -0
- package/build/esm/utils/cleanNativeOptions.js +19 -0
- package/build/esm/utils/cleanNativeOptions.js.map +1 -0
- package/build/esm/utils/concatenateBuffers.js +21 -0
- package/build/esm/utils/concatenateBuffers.js.map +1 -0
- package/build/esm/utils/convertPCMToFloat32.js +120 -0
- package/build/esm/utils/convertPCMToFloat32.js.map +1 -0
- package/build/esm/utils/crc32.js +50 -0
- package/build/esm/utils/crc32.js.map +1 -0
- package/build/esm/utils/encodingToBitDepth.js +13 -0
- package/build/esm/utils/encodingToBitDepth.js.map +1 -0
- package/build/esm/utils/getWavFileInfo.js +92 -0
- package/build/esm/utils/getWavFileInfo.js.map +1 -0
- package/build/esm/utils/writeWavHeader.js +84 -0
- package/build/esm/utils/writeWavHeader.js.map +1 -0
- package/build/esm/workers/InlineFeaturesExtractor.web.js +291 -0
- package/build/esm/workers/InlineFeaturesExtractor.web.js.map +1 -0
- package/build/esm/workers/inlineAudioWebWorker.web.js +187 -0
- package/build/esm/workers/inlineAudioWebWorker.web.js.map +1 -0
- package/build/esm/workers/wasmGlueString.web.js +24 -0
- package/build/esm/workers/wasmGlueString.web.js.map +1 -0
- package/build/types/AudioAnalysis/AudioAnalysis.types.d.ts +198 -0
- package/build/types/AudioAnalysis/AudioAnalysis.types.d.ts.map +1 -0
- package/build/types/AudioAnalysis/audioFeaturesWasm.d.ts +24 -0
- package/build/types/AudioAnalysis/audioFeaturesWasm.d.ts.map +1 -0
- package/build/types/AudioAnalysis/extractAudioAnalysis.d.ts +74 -0
- package/build/types/AudioAnalysis/extractAudioAnalysis.d.ts.map +1 -0
- package/build/types/AudioAnalysis/extractAudioData.d.ts +3 -0
- package/build/types/AudioAnalysis/extractAudioData.d.ts.map +1 -0
- package/build/types/AudioAnalysis/extractMelSpectrogram.d.ts +20 -0
- package/build/types/AudioAnalysis/extractMelSpectrogram.d.ts.map +1 -0
- package/build/types/AudioAnalysis/extractPreview.d.ts +11 -0
- package/build/types/AudioAnalysis/extractPreview.d.ts.map +1 -0
- package/build/types/AudioAnalysis/extractWaveform.d.ts +8 -0
- package/build/types/AudioAnalysis/extractWaveform.d.ts.map +1 -0
- package/build/types/AudioAnalysis/melSpectrogramWasm.d.ts +16 -0
- package/build/types/AudioAnalysis/melSpectrogramWasm.d.ts.map +1 -0
- package/build/types/AudioDeviceManager.d.ts +187 -0
- package/build/types/AudioDeviceManager.d.ts.map +1 -0
- package/build/types/AudioRecorder.provider.d.ts +11 -0
- package/build/types/AudioRecorder.provider.d.ts.map +1 -0
- package/build/types/AudioStudio.native.d.ts +3 -0
- package/build/types/AudioStudio.native.d.ts.map +1 -0
- package/build/types/AudioStudio.types.d.ts +760 -0
- package/build/types/AudioStudio.types.d.ts.map +1 -0
- package/build/types/AudioStudio.web.d.ts +96 -0
- package/build/types/AudioStudio.web.d.ts.map +1 -0
- package/build/types/AudioStudioModule.d.ts +3 -0
- package/build/types/AudioStudioModule.d.ts.map +1 -0
- package/build/types/WebRecorder.web.d.ts +208 -0
- package/build/types/WebRecorder.web.d.ts.map +1 -0
- package/build/types/constants/platformLimitations.d.ts +40 -0
- package/build/types/constants/platformLimitations.d.ts.map +1 -0
- package/build/types/constants.d.ts +14 -0
- package/build/types/constants.d.ts.map +1 -0
- package/build/types/events.d.ts +29 -0
- package/build/types/events.d.ts.map +1 -0
- package/build/types/hooks/useAudioDevices.d.ts +15 -0
- package/build/types/hooks/useAudioDevices.d.ts.map +1 -0
- package/build/types/index.d.ts +21 -0
- package/build/types/index.d.ts.map +1 -0
- package/build/types/trimAudio.d.ts +25 -0
- package/build/types/trimAudio.d.ts.map +1 -0
- package/build/types/useAudioRecorder.d.ts +22 -0
- package/build/types/useAudioRecorder.d.ts.map +1 -0
- package/build/types/utils/BlobFix.d.ts +9 -0
- package/build/types/utils/BlobFix.d.ts.map +1 -0
- package/build/types/utils/audioProcessing.d.ts +24 -0
- package/build/types/utils/audioProcessing.d.ts.map +1 -0
- package/build/types/utils/cleanNativeOptions.d.ts +15 -0
- package/build/types/utils/cleanNativeOptions.d.ts.map +1 -0
- package/build/types/utils/concatenateBuffers.d.ts +8 -0
- package/build/types/utils/concatenateBuffers.d.ts.map +1 -0
- package/build/types/utils/convertPCMToFloat32.d.ts +13 -0
- package/build/types/utils/convertPCMToFloat32.d.ts.map +1 -0
- package/build/types/utils/crc32.d.ts +7 -0
- package/build/types/utils/crc32.d.ts.map +1 -0
- package/build/types/utils/encodingToBitDepth.d.ts +5 -0
- package/build/types/utils/encodingToBitDepth.d.ts.map +1 -0
- package/build/types/utils/getWavFileInfo.d.ts +26 -0
- package/build/types/utils/getWavFileInfo.d.ts.map +1 -0
- package/build/types/utils/writeWavHeader.d.ts +34 -0
- package/build/types/utils/writeWavHeader.d.ts.map +1 -0
- package/build/types/workers/InlineFeaturesExtractor.web.d.ts +2 -0
- package/build/types/workers/InlineFeaturesExtractor.web.d.ts.map +1 -0
- package/build/types/workers/inlineAudioWebWorker.web.d.ts +2 -0
- package/build/types/workers/inlineAudioWebWorker.web.d.ts.map +1 -0
- package/build/types/workers/wasmGlueString.web.d.ts +2 -0
- package/build/types/workers/wasmGlueString.web.d.ts.map +1 -0
- package/cpp/AudioFeatures.cpp +274 -0
- package/cpp/AudioFeatures.h +85 -0
- package/cpp/AudioFeaturesBridge.cpp +146 -0
- package/cpp/AudioFeaturesBridge.h +47 -0
- package/cpp/MelSpectrogram.cpp +227 -0
- package/cpp/MelSpectrogram.h +82 -0
- package/cpp/MelSpectrogramBridge.cpp +112 -0
- package/cpp/MelSpectrogramBridge.h +33 -0
- package/cpp/kiss_fft/COPYING +11 -0
- package/cpp/kiss_fft/_kiss_fft_guts.h +167 -0
- package/cpp/kiss_fft/kiss_fft.c +424 -0
- package/cpp/kiss_fft/kiss_fft.h +160 -0
- package/cpp/kiss_fft/kiss_fft_log.h +36 -0
- package/cpp/kiss_fft/kiss_fftr.c +155 -0
- package/cpp/kiss_fft/kiss_fftr.h +54 -0
- package/expo-module.config.json +10 -0
- package/ios/AudioAnalysisData.swift +74 -0
- package/ios/AudioDeviceManager.swift +670 -0
- package/ios/AudioFeaturesWrapper.h +21 -0
- package/ios/AudioFeaturesWrapper.mm +63 -0
- package/ios/AudioNotificationManager.swift +154 -0
- package/ios/AudioProcessingHelpers.swift +797 -0
- package/ios/AudioProcessor.swift +1191 -0
- package/ios/AudioStreamError.swift +7 -0
- package/ios/AudioStreamManager.swift +2369 -0
- package/ios/AudioStreamManagerDelegate.swift +16 -0
- package/ios/AudioStudio.podspec +39 -0
- package/ios/AudioStudioModule.swift +1111 -0
- package/ios/AudioStudioTests/AudioFileHandlerTests.swift +338 -0
- package/ios/AudioStudioTests/AudioFormatUtilsTests.swift +331 -0
- package/ios/AudioStudioTests/AudioTestHelpers.swift +130 -0
- package/ios/AudioStudioTests/CompressedOnlyOutputTests.swift +294 -0
- package/ios/AudioStudioTests/EventEmissionIntervalTests.swift +105 -0
- package/ios/AudioStudioTests/Info.plist +22 -0
- package/ios/AudioStudioTests/README.md +39 -0
- package/ios/AudioStudioTests/SimpleAudioTest.swift +98 -0
- package/ios/AudioStudioTests/TestAudioGenerator.swift +75 -0
- package/ios/DataPoint.swift +54 -0
- package/ios/DecodingConfig.swift +59 -0
- package/ios/FFT.swift +62 -0
- package/ios/Features.swift +95 -0
- package/ios/ISSUE_IOS.md +68 -0
- package/ios/Logger.swift +39 -0
- package/ios/MelSpectrogramWrapper.h +30 -0
- package/ios/MelSpectrogramWrapper.mm +97 -0
- package/ios/NotificationExtension.swift +15 -0
- package/ios/RecordingResult.swift +22 -0
- package/ios/RecordingSettings.swift +311 -0
- package/ios/WaveformExtractor.swift +105 -0
- package/ios/tests/README.md +41 -0
- package/ios/tests/integration/buffer_and_fallback_test.swift +178 -0
- package/ios/tests/integration/buffer_duration_test.swift +185 -0
- package/ios/tests/integration/compressed_only_output_test.swift +271 -0
- package/ios/tests/integration/output_control_test.swift +322 -0
- package/ios/tests/integration/run_integration_tests.sh +37 -0
- package/ios/tests/opus_support_test_macos.swift +154 -0
- package/ios/tests/standalone/audio_processing_test.swift +144 -0
- package/ios/tests/standalone/audio_recording_test.swift +277 -0
- package/ios/tests/standalone/audio_streaming_test.swift +249 -0
- package/ios/tests/standalone/standalone_test.swift +144 -0
- package/package.json +146 -0
- package/plugin/build/index.cjs +194 -0
- package/plugin/build/index.d.cts +22 -0
- package/plugin/build/index.js +194 -0
- package/plugin/src/index.ts +285 -0
- package/plugin/tsconfig.json +10 -0
- package/plugin/tsconfig.tsbuildinfo +1 -0
- package/prebuilt/wasm/mel-spectrogram.js +18 -0
- package/src/AudioAnalysis/AudioAnalysis.types.ts +226 -0
- package/src/AudioAnalysis/audio-features-wasm.d.ts +37 -0
- package/src/AudioAnalysis/audioFeaturesWasm.ts +200 -0
- package/src/AudioAnalysis/extractAudioAnalysis.ts +350 -0
- package/src/AudioAnalysis/extractAudioData.ts +17 -0
- package/src/AudioAnalysis/extractMelSpectrogram.ts +140 -0
- package/src/AudioAnalysis/extractPreview.ts +34 -0
- package/src/AudioAnalysis/extractWaveform.ts +22 -0
- package/src/AudioAnalysis/mel-spectrogram-wasm.d.ts +48 -0
- package/src/AudioAnalysis/melSpectrogramWasm.ts +179 -0
- package/src/AudioDeviceManager.ts +800 -0
- package/src/AudioRecorder.provider.tsx +57 -0
- package/src/AudioStudio.native.ts +6 -0
- package/src/AudioStudio.types.ts +899 -0
- package/src/AudioStudio.web.ts +911 -0
- package/src/AudioStudioModule.ts +984 -0
- package/src/WebRecorder.web.ts +1114 -0
- package/src/constants/platformLimitations.ts +118 -0
- package/src/constants.ts +21 -0
- package/src/events.ts +63 -0
- package/src/hooks/useAudioDevices.ts +213 -0
- package/src/index.ts +67 -0
- package/src/trimAudio.ts +94 -0
- package/src/types/crc-32.d.ts +9 -0
- package/src/useAudioRecorder.tsx +784 -0
- package/src/utils/BlobFix.ts +561 -0
- package/src/utils/audioProcessing.ts +205 -0
- package/src/utils/cleanNativeOptions.ts +18 -0
- package/src/utils/concatenateBuffers.ts +24 -0
- package/src/utils/convertPCMToFloat32.ts +170 -0
- package/src/utils/crc32.ts +59 -0
- package/src/utils/encodingToBitDepth.ts +18 -0
- package/src/utils/getWavFileInfo.ts +132 -0
- package/src/utils/writeWavHeader.ts +115 -0
- package/src/workers/InlineFeaturesExtractor.web.tsx +291 -0
- package/src/workers/inlineAudioWebWorker.web.tsx +186 -0
- package/src/workers/wasmGlueString.web.ts +23 -0
|
@@ -0,0 +1,96 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
// packages/audio-studio/src/utils/getWavFileInfo.ts
|
|
3
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
4
|
+
exports.getWavFileInfo = void 0;
|
|
5
|
+
const constants_1 = require("../constants");
|
|
6
|
+
// Audio format descriptions
|
|
7
|
+
const AUDIO_FORMATS = {
|
|
8
|
+
1: 'PCM',
|
|
9
|
+
3: 'IEEE float',
|
|
10
|
+
6: '8-bit ITU-T G.711 A-law',
|
|
11
|
+
7: '8-bit ITU-T G.711 µ-law',
|
|
12
|
+
65534: 'WAVE_FORMAT_EXTENSIBLE',
|
|
13
|
+
};
|
|
14
|
+
/**
|
|
15
|
+
* Extracts metadata from a WAV buffer.
|
|
16
|
+
*
|
|
17
|
+
* @param arrayBuffer - The array buffer containing the WAV data.
|
|
18
|
+
* @returns A promise that resolves to the extracted metadata.
|
|
19
|
+
*/
|
|
20
|
+
const getWavFileInfo = async (arrayBuffer) => {
|
|
21
|
+
const view = new DataView(arrayBuffer);
|
|
22
|
+
// Check if the file is a valid RIFF/WAVE file
|
|
23
|
+
const riffHeader = view.getUint32(0, false);
|
|
24
|
+
const waveHeader = view.getUint32(8, false);
|
|
25
|
+
if (riffHeader !== constants_1.RIFF_HEADER || waveHeader !== constants_1.WAVE_HEADER) {
|
|
26
|
+
throw new Error('Invalid WAV file');
|
|
27
|
+
}
|
|
28
|
+
// Initialize variables for the metadata
|
|
29
|
+
let fmtChunkOffset = 12;
|
|
30
|
+
let sampleRate = constants_1.DEFAULT_SAMPLE_RATE;
|
|
31
|
+
let numChannels = 0;
|
|
32
|
+
let bitDepth = constants_1.DEFAULT_BIT_DEPTH;
|
|
33
|
+
let dataChunkSize = 0;
|
|
34
|
+
let audioFormat = 0;
|
|
35
|
+
let byteRate = 0;
|
|
36
|
+
let blockAlign = 0;
|
|
37
|
+
let creationDateTime = '';
|
|
38
|
+
let comments = '';
|
|
39
|
+
let dataChunkOffset = 0;
|
|
40
|
+
// Parse chunks to find the "fmt " and "data" chunks
|
|
41
|
+
while (fmtChunkOffset < view.byteLength) {
|
|
42
|
+
const chunkId = view.getUint32(fmtChunkOffset, false);
|
|
43
|
+
const chunkSize = view.getUint32(fmtChunkOffset + 4, true);
|
|
44
|
+
if (chunkId === constants_1.FMT_CHUNK_ID) {
|
|
45
|
+
// "fmt "
|
|
46
|
+
audioFormat = view.getUint16(fmtChunkOffset + 8, true);
|
|
47
|
+
if (!AUDIO_FORMATS[audioFormat]) {
|
|
48
|
+
throw new Error('Unsupported WAV file format');
|
|
49
|
+
}
|
|
50
|
+
numChannels = view.getUint16(fmtChunkOffset + 10, true);
|
|
51
|
+
sampleRate = view.getUint32(fmtChunkOffset + 12, true);
|
|
52
|
+
byteRate = view.getUint32(fmtChunkOffset + 16, true);
|
|
53
|
+
blockAlign = view.getUint16(fmtChunkOffset + 20, true);
|
|
54
|
+
bitDepth = view.getUint16(fmtChunkOffset + 22, true);
|
|
55
|
+
}
|
|
56
|
+
else if (chunkId === constants_1.DATA_CHUNK_ID) {
|
|
57
|
+
// "data"
|
|
58
|
+
dataChunkSize = chunkSize;
|
|
59
|
+
dataChunkOffset = fmtChunkOffset + 8; // Position after chunk header
|
|
60
|
+
break;
|
|
61
|
+
}
|
|
62
|
+
else if (chunkId === constants_1.INFO_CHUNK_ID) {
|
|
63
|
+
// "INFO"
|
|
64
|
+
// Read INFO chunk (assuming it contains a text-based creation date/time and comments)
|
|
65
|
+
const infoStart = fmtChunkOffset + 8;
|
|
66
|
+
const infoText = new TextDecoder().decode(new Uint8Array(arrayBuffer.slice(infoStart, infoStart + chunkSize)));
|
|
67
|
+
const infoParts = infoText.split('\0');
|
|
68
|
+
creationDateTime = infoParts[0];
|
|
69
|
+
comments = infoParts[1];
|
|
70
|
+
}
|
|
71
|
+
fmtChunkOffset += 8 + chunkSize;
|
|
72
|
+
}
|
|
73
|
+
if (!sampleRate || !numChannels || !bitDepth || !dataChunkSize) {
|
|
74
|
+
throw new Error('Incomplete WAV file information');
|
|
75
|
+
}
|
|
76
|
+
// Calculate duration
|
|
77
|
+
const bytesPerSample = bitDepth / 8;
|
|
78
|
+
const numSamples = dataChunkSize / (numChannels * bytesPerSample);
|
|
79
|
+
const durationMs = (numSamples / sampleRate) * 1000;
|
|
80
|
+
return {
|
|
81
|
+
sampleRate,
|
|
82
|
+
numChannels,
|
|
83
|
+
bitDepth,
|
|
84
|
+
size: arrayBuffer.byteLength,
|
|
85
|
+
durationMs,
|
|
86
|
+
audioFormatDescription: AUDIO_FORMATS[audioFormat],
|
|
87
|
+
byteRate,
|
|
88
|
+
blockAlign,
|
|
89
|
+
creationDateTime: creationDateTime || undefined,
|
|
90
|
+
comments: comments || undefined,
|
|
91
|
+
compressionType: audioFormat === 1 ? 'None' : AUDIO_FORMATS[audioFormat],
|
|
92
|
+
dataChunkOffset,
|
|
93
|
+
};
|
|
94
|
+
};
|
|
95
|
+
exports.getWavFileInfo = getWavFileInfo;
|
|
96
|
+
//# sourceMappingURL=getWavFileInfo.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"getWavFileInfo.js","sourceRoot":"","sources":["../../../src/utils/getWavFileInfo.ts"],"names":[],"mappings":";AAAA,oDAAoD;;;AAGpD,4CAQqB;AAErB,4BAA4B;AAC5B,MAAM,aAAa,GAA8B;IAC7C,CAAC,EAAE,KAAK;IACR,CAAC,EAAE,YAAY;IACf,CAAC,EAAE,yBAAyB;IAC5B,CAAC,EAAE,yBAAyB;IAC5B,KAAK,EAAE,wBAAwB;CAClC,CAAA;AAoBD;;;;;GAKG;AACI,MAAM,cAAc,GAAG,KAAK,EAC/B,WAAwB,EACJ,EAAE;IACtB,MAAM,IAAI,GAAG,IAAI,QAAQ,CAAC,WAAW,CAAC,CAAA;IAEtC,8CAA8C;IAC9C,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,CAAA;IAC3C,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,CAAA;IAC3C,IAAI,UAAU,KAAK,uBAAW,IAAI,UAAU,KAAK,uBAAW,EAAE,CAAC;QAC3D,MAAM,IAAI,KAAK,CAAC,kBAAkB,CAAC,CAAA;IACvC,CAAC;IAED,wCAAwC;IACxC,IAAI,cAAc,GAAG,EAAE,CAAA;IACvB,IAAI,UAAU,GAAe,+BAAmB,CAAA;IAChD,IAAI,WAAW,GAAG,CAAC,CAAA;IACnB,IAAI,QAAQ,GAAa,6BAAiB,CAAA;IAC1C,IAAI,aAAa,GAAG,CAAC,CAAA;IACrB,IAAI,WAAW,GAAG,CAAC,CAAA;IACnB,IAAI,QAAQ,GAAG,CAAC,CAAA;IAChB,IAAI,UAAU,GAAG,CAAC,CAAA;IAClB,IAAI,gBAAgB,GAAG,EAAE,CAAA;IACzB,IAAI,QAAQ,GAAG,EAAE,CAAA;IACjB,IAAI,eAAe,GAAG,CAAC,CAAA;IAEvB,oDAAoD;IACpD,OAAO,cAAc,GAAG,IAAI,CAAC,UAAU,EAAE,CAAC;QACtC,MAAM,OAAO,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,EAAE,KAAK,CAAC,CAAA;QACrD,MAAM,SAAS,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,CAAC,EAAE,IAAI,CAAC,CAAA;QAC1D,IAAI,OAAO,KAAK,wBAAY,EAAE,CAAC;YAC3B,SAAS;YACT,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,CAAC,EAAE,IAAI,CAAC,CAAA;YACtD,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,EAAE,CAAC;gBAC9B,MAAM,IAAI,KAAK,CAAC,6BAA6B,CAAC,CAAA;YAClD,CAAC;YACD,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACvD,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAe,CAAA;YACpE,QAAQ,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACpD,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACtD,QAAQ,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAa,CAAA;QACpE,CAAC;aAAM,IAAI,OAAO,KAAK,yBAAa,EAAE,CAAC;YACnC,SAAS;YACT,aAAa,GAAG,SAAS,CAAA;YACzB,eAAe,GAAG,cAAc,GAAG,CAAC,CAAA,CAAC,8BAA8B;YACnE,MAAK;QACT,CAAC;aAAM,IAAI,OAAO,KAAK,yBAAa,EAAE,CAAC;YACnC,SAAS;YACT,sFAAsF;YACtF,MAAM,SAAS,GAAG,cAAc,GAAG,CAAC,CAAA;YACpC,MAAM,QAAQ,GAAG,IAAI,WAAW,EAAE,CAAC,MAAM,CACrC,IAAI,UAAU,CACV,WAAW,CAAC,KAAK,CAAC,SAAS,EAAE,SAAS,GAAG,SAAS,CAAC,CACtD,CACJ,CAAA;YACD,MAAM,SAAS,GAAG,QAAQ,CAAC,KAAK,CAAC,IAAI,CAAC,CAAA;YACtC,gBAAgB,GAAG,SAAS,CAAC,CAAC,CAAC,CAAA;YAC/B,QAAQ,GAAG,SAAS,CAAC,CAAC,CAAC,CAAA;QAC3B,CAAC;QACD,cAAc,IAAI,CAAC,GAAG,SAAS,CAAA;IACnC,CAAC;IAED,IAAI,CAAC,UAAU,IAAI,CAAC,WAAW,IAAI,CAAC,QAAQ,IAAI,CAAC,aAAa,EAAE,CAAC;QAC7D,MAAM,IAAI,KAAK,CAAC,iCAAiC,CAAC,CAAA;IACtD,CAAC;IAED,qBAAqB;IACrB,MAAM,cAAc,GAAG,QAAQ,GAAG,CAAC,CAAA;IACnC,MAAM,UAAU,GAAG,aAAa,GAAG,CAAC,WAAW,GAAG,cAAc,CAAC,CAAA;IACjE,MAAM,UAAU,GAAG,CAAC,UAAU,GAAG,UAAU,CAAC,GAAG,IAAI,CAAA;IAEnD,OAAO;QACH,UAAU;QACV,WAAW;QACX,QAAQ;QACR,IAAI,EAAE,WAAW,CAAC,UAAU;QAC5B,UAAU;QACV,sBAAsB,EAAE,aAAa,CAAC,WAAW,CAAC;QAClD,QAAQ;QACR,UAAU;QACV,gBAAgB,EAAE,gBAAgB,IAAI,SAAS;QAC/C,QAAQ,EAAE,QAAQ,IAAI,SAAS;QAC/B,eAAe,EACX,WAAW,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,aAAa,CAAC,WAAW,CAAC;QAC3D,eAAe;KAClB,CAAA;AACL,CAAC,CAAA;AArFY,QAAA,cAAc,kBAqF1B","sourcesContent":["// packages/audio-studio/src/utils/getWavFileInfo.ts\n\nimport { BitDepth, SampleRate } from '../AudioStudio.types'\nimport {\n DATA_CHUNK_ID,\n DEFAULT_BIT_DEPTH,\n DEFAULT_SAMPLE_RATE,\n FMT_CHUNK_ID,\n INFO_CHUNK_ID,\n RIFF_HEADER,\n WAVE_HEADER,\n} from '../constants'\n\n// Audio format descriptions\nconst AUDIO_FORMATS: { [key: number]: string } = {\n 1: 'PCM',\n 3: 'IEEE float',\n 6: '8-bit ITU-T G.711 A-law',\n 7: '8-bit ITU-T G.711 µ-law',\n 65534: 'WAVE_FORMAT_EXTENSIBLE',\n}\n\n/**\n * Interface representing the metadata of a WAV file.\n */\nexport interface WavFileInfo {\n sampleRate: SampleRate\n numChannels: number\n bitDepth: BitDepth\n size: number // in bytes\n durationMs: number // in ms\n audioFormatDescription: string // Description of the audio format\n byteRate: number // Average bytes per second\n blockAlign: number // Number of bytes for one sample including all channels\n creationDateTime?: string // Optional creation date and time\n comments?: string // Optional comments or tags\n compressionType?: string // Optional compression type\n dataChunkOffset: number // Position of the first data chunk\n}\n\n/**\n * Extracts metadata from a WAV buffer.\n *\n * @param arrayBuffer - The array buffer containing the WAV data.\n * @returns A promise that resolves to the extracted metadata.\n */\nexport const getWavFileInfo = async (\n arrayBuffer: ArrayBuffer\n): Promise<WavFileInfo> => {\n const view = new DataView(arrayBuffer)\n\n // Check if the file is a valid RIFF/WAVE file\n const riffHeader = view.getUint32(0, false)\n const waveHeader = view.getUint32(8, false)\n if (riffHeader !== RIFF_HEADER || waveHeader !== WAVE_HEADER) {\n throw new Error('Invalid WAV file')\n }\n\n // Initialize variables for the metadata\n let fmtChunkOffset = 12\n let sampleRate: SampleRate = DEFAULT_SAMPLE_RATE\n let numChannels = 0\n let bitDepth: BitDepth = DEFAULT_BIT_DEPTH\n let dataChunkSize = 0\n let audioFormat = 0\n let byteRate = 0\n let blockAlign = 0\n let creationDateTime = ''\n let comments = ''\n let dataChunkOffset = 0\n\n // Parse chunks to find the \"fmt \" and \"data\" chunks\n while (fmtChunkOffset < view.byteLength) {\n const chunkId = view.getUint32(fmtChunkOffset, false)\n const chunkSize = view.getUint32(fmtChunkOffset + 4, true)\n if (chunkId === FMT_CHUNK_ID) {\n // \"fmt \"\n audioFormat = view.getUint16(fmtChunkOffset + 8, true)\n if (!AUDIO_FORMATS[audioFormat]) {\n throw new Error('Unsupported WAV file format')\n }\n numChannels = view.getUint16(fmtChunkOffset + 10, true)\n sampleRate = view.getUint32(fmtChunkOffset + 12, true) as SampleRate\n byteRate = view.getUint32(fmtChunkOffset + 16, true)\n blockAlign = view.getUint16(fmtChunkOffset + 20, true)\n bitDepth = view.getUint16(fmtChunkOffset + 22, true) as BitDepth\n } else if (chunkId === DATA_CHUNK_ID) {\n // \"data\"\n dataChunkSize = chunkSize\n dataChunkOffset = fmtChunkOffset + 8 // Position after chunk header\n break\n } else if (chunkId === INFO_CHUNK_ID) {\n // \"INFO\"\n // Read INFO chunk (assuming it contains a text-based creation date/time and comments)\n const infoStart = fmtChunkOffset + 8\n const infoText = new TextDecoder().decode(\n new Uint8Array(\n arrayBuffer.slice(infoStart, infoStart + chunkSize)\n )\n )\n const infoParts = infoText.split('\\0')\n creationDateTime = infoParts[0]\n comments = infoParts[1]\n }\n fmtChunkOffset += 8 + chunkSize\n }\n\n if (!sampleRate || !numChannels || !bitDepth || !dataChunkSize) {\n throw new Error('Incomplete WAV file information')\n }\n\n // Calculate duration\n const bytesPerSample = bitDepth / 8\n const numSamples = dataChunkSize / (numChannels * bytesPerSample)\n const durationMs = (numSamples / sampleRate) * 1000\n\n return {\n sampleRate,\n numChannels,\n bitDepth,\n size: arrayBuffer.byteLength,\n durationMs,\n audioFormatDescription: AUDIO_FORMATS[audioFormat],\n byteRate,\n blockAlign,\n creationDateTime: creationDateTime || undefined,\n comments: comments || undefined,\n compressionType:\n audioFormat === 1 ? 'None' : AUDIO_FORMATS[audioFormat],\n dataChunkOffset,\n }\n}\n"]}
|
|
@@ -0,0 +1,88 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
// packages/audio-studio/src/utils/writeWavHeader.ts
|
|
3
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
4
|
+
exports.writeWavHeader = void 0;
|
|
5
|
+
/**
|
|
6
|
+
* Writes or updates a WAV (RIFF) header based on the provided options.
|
|
7
|
+
*
|
|
8
|
+
* This function can be used in three ways:
|
|
9
|
+
* 1. To create a standalone WAV header (when no buffer is provided).
|
|
10
|
+
* 2. To create a WAV header and combine it with existing audio data (when a buffer without a header is provided).
|
|
11
|
+
* 3. To update an existing WAV header in the provided buffer.
|
|
12
|
+
*
|
|
13
|
+
* For streaming audio where the final size is unknown, this function sets the size fields
|
|
14
|
+
* to the maximum 32-bit value (0xFFFFFFFF). These can be updated later using the
|
|
15
|
+
* `updateWavHeaderSize` function once the final size is known.
|
|
16
|
+
*
|
|
17
|
+
* @param options - The options for creating or updating the WAV header.
|
|
18
|
+
* @returns An ArrayBuffer containing the WAV header, or the header combined with the provided audio data.
|
|
19
|
+
*
|
|
20
|
+
* @throws {Error} Throws an error if the provided options are invalid or if the buffer is too small.
|
|
21
|
+
*/
|
|
22
|
+
const writeWavHeader = ({ buffer, sampleRate, numChannels, bitDepth, isFloat = bitDepth === 32, // Default to float for 32-bit
|
|
23
|
+
}) => {
|
|
24
|
+
// For 32-bit float, we use format 3, otherwise format 1 for PCM
|
|
25
|
+
const audioFormat = isFloat ? 3 : 1; // 3 = IEEE float, 1 = PCM
|
|
26
|
+
const bytesPerSample = bitDepth / 8;
|
|
27
|
+
const blockAlign = numChannels * bytesPerSample;
|
|
28
|
+
const byteRate = sampleRate * blockAlign;
|
|
29
|
+
// Function to write a string to the DataView
|
|
30
|
+
const writeString = (view, offset, string) => {
|
|
31
|
+
for (let i = 0; i < string.length; i++) {
|
|
32
|
+
view.setUint8(offset + i, string.charCodeAt(i));
|
|
33
|
+
}
|
|
34
|
+
};
|
|
35
|
+
// Function to write or update the header
|
|
36
|
+
const writeHeader = (view, dataSize = 0xffffffff) => {
|
|
37
|
+
// RIFF chunk descriptor
|
|
38
|
+
writeString(view, 0, 'RIFF'); // ChunkID
|
|
39
|
+
view.setUint32(4, 36 + dataSize, true); // ChunkSize: 4 + (8 + 16) + (8 + dataSize)
|
|
40
|
+
writeString(view, 8, 'WAVE'); // Format
|
|
41
|
+
// "fmt " sub-chunk
|
|
42
|
+
writeString(view, 12, 'fmt '); // Subchunk1ID
|
|
43
|
+
view.setUint32(16, 16, true); // Subchunk1Size (16 for PCM/Float)
|
|
44
|
+
view.setUint16(20, audioFormat, true); // AudioFormat (3 for float, 1 for PCM)
|
|
45
|
+
view.setUint16(22, numChannels, true); // NumChannels
|
|
46
|
+
view.setUint32(24, sampleRate, true); // SampleRate
|
|
47
|
+
view.setUint32(28, byteRate, true); // ByteRate = SampleRate * NumChannels * BitsPerSample/8
|
|
48
|
+
view.setUint16(32, blockAlign, true); // BlockAlign = NumChannels * BitsPerSample/8
|
|
49
|
+
view.setUint16(34, bitDepth, true); // BitsPerSample
|
|
50
|
+
// "data" sub-chunk
|
|
51
|
+
writeString(view, 36, 'data'); // Subchunk2ID
|
|
52
|
+
view.setUint32(40, dataSize, true); // Subchunk2Size = NumSamples * NumChannels * BitsPerSample/8
|
|
53
|
+
};
|
|
54
|
+
if (buffer) {
|
|
55
|
+
// Handle existing buffer
|
|
56
|
+
// Check for minimum size
|
|
57
|
+
if (buffer.byteLength < 44) {
|
|
58
|
+
throw new Error('Buffer is too small to contain a valid WAV header');
|
|
59
|
+
}
|
|
60
|
+
const view = new DataView(buffer);
|
|
61
|
+
// Check if the buffer already has a WAV header by looking for "RIFF" at the start
|
|
62
|
+
const existingHeader = view.getUint32(0, false) === 0x52494646; // "RIFF" in ASCII
|
|
63
|
+
if (existingHeader) {
|
|
64
|
+
// Update the existing header
|
|
65
|
+
writeHeader(view, buffer.byteLength - 44);
|
|
66
|
+
return buffer;
|
|
67
|
+
}
|
|
68
|
+
else {
|
|
69
|
+
// Create a new buffer with header + data
|
|
70
|
+
const newBuffer = new ArrayBuffer(44 + buffer.byteLength);
|
|
71
|
+
const newView = new DataView(newBuffer);
|
|
72
|
+
// Write header to new buffer
|
|
73
|
+
writeHeader(newView, buffer.byteLength);
|
|
74
|
+
// Copy audio data after header
|
|
75
|
+
new Uint8Array(newBuffer).set(new Uint8Array(buffer), 44);
|
|
76
|
+
return newBuffer;
|
|
77
|
+
}
|
|
78
|
+
}
|
|
79
|
+
else {
|
|
80
|
+
// Create standalone header
|
|
81
|
+
const headerBuffer = new ArrayBuffer(44);
|
|
82
|
+
const view = new DataView(headerBuffer);
|
|
83
|
+
writeHeader(view);
|
|
84
|
+
return headerBuffer;
|
|
85
|
+
}
|
|
86
|
+
};
|
|
87
|
+
exports.writeWavHeader = writeWavHeader;
|
|
88
|
+
//# sourceMappingURL=writeWavHeader.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"writeWavHeader.js","sourceRoot":"","sources":["../../../src/utils/writeWavHeader.ts"],"names":[],"mappings":";AAAA,oDAAoD;;;AAkBpD;;;;;;;;;;;;;;;;GAgBG;AACI,MAAM,cAAc,GAAG,CAAC,EAC3B,MAAM,EACN,UAAU,EACV,WAAW,EACX,QAAQ,EACR,OAAO,GAAG,QAAQ,KAAK,EAAE,EAAE,8BAA8B;EAC1C,EAAe,EAAE;IAChC,gEAAgE;IAChE,MAAM,WAAW,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAA,CAAC,0BAA0B;IAE9D,MAAM,cAAc,GAAG,QAAQ,GAAG,CAAC,CAAA;IACnC,MAAM,UAAU,GAAG,WAAW,GAAG,cAAc,CAAA;IAC/C,MAAM,QAAQ,GAAG,UAAU,GAAG,UAAU,CAAA;IAExC,6CAA6C;IAC7C,MAAM,WAAW,GAAG,CAAC,IAAc,EAAE,MAAc,EAAE,MAAc,EAAE,EAAE;QACnE,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACrC,IAAI,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,MAAM,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC,CAAA;QACnD,CAAC;IACL,CAAC,CAAA;IAED,yCAAyC;IACzC,MAAM,WAAW,GAAG,CAAC,IAAc,EAAE,WAAmB,UAAU,EAAE,EAAE;QAClE,wBAAwB;QACxB,WAAW,CAAC,IAAI,EAAE,CAAC,EAAE,MAAM,CAAC,CAAA,CAAC,UAAU;QACvC,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,GAAG,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,2CAA2C;QAClF,WAAW,CAAC,IAAI,EAAE,CAAC,EAAE,MAAM,CAAC,CAAA,CAAC,SAAS;QAEtC,mBAAmB;QACnB,WAAW,CAAC,IAAI,EAAE,EAAE,EAAE,MAAM,CAAC,CAAA,CAAC,cAAc;QAC5C,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,EAAE,EAAE,IAAI,CAAC,CAAA,CAAC,mCAAmC;QAChE,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,WAAW,EAAE,IAAI,CAAC,CAAA,CAAC,uCAAuC;QAC7E,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,WAAW,EAAE,IAAI,CAAC,CAAA,CAAC,cAAc;QACpD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,aAAa;QAClD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,wDAAwD;QAC3F,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,6CAA6C;QAClF,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,gBAAgB;QAEnD,mBAAmB;QACnB,WAAW,CAAC,IAAI,EAAE,EAAE,EAAE,MAAM,CAAC,CAAA,CAAC,cAAc;QAC5C,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,6DAA6D;IACpG,CAAC,CAAA;IAED,IAAI,MAAM,EAAE,CAAC;QACT,yBAAyB;QAEzB,yBAAyB;QACzB,IAAI,MAAM,CAAC,UAAU,GAAG,EAAE,EAAE,CAAC;YACzB,MAAM,IAAI,KAAK,CAAC,mDAAmD,CAAC,CAAA;QACxE,CAAC;QAED,MAAM,IAAI,GAAG,IAAI,QAAQ,CAAC,MAAM,CAAC,CAAA;QAEjC,kFAAkF;QAClF,MAAM,cAAc,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,KAAK,UAAU,CAAA,CAAC,kBAAkB;QAEjF,IAAI,cAAc,EAAE,CAAC;YACjB,6BAA6B;YAC7B,WAAW,CAAC,IAAI,EAAE,MAAM,CAAC,UAAU,GAAG,EAAE,CAAC,CAAA;YACzC,OAAO,MAAM,CAAA;QACjB,CAAC;aAAM,CAAC;YACJ,yCAAyC;YACzC,MAAM,SAAS,GAAG,IAAI,WAAW,CAAC,EAAE,GAAG,MAAM,CAAC,UAAU,CAAC,CAAA;YACzD,MAAM,OAAO,GAAG,IAAI,QAAQ,CAAC,SAAS,CAAC,CAAA;YAEvC,6BAA6B;YAC7B,WAAW,CAAC,OAAO,EAAE,MAAM,CAAC,UAAU,CAAC,CAAA;YAEvC,+BAA+B;YAC/B,IAAI,UAAU,CAAC,SAAS,CAAC,CAAC,GAAG,CAAC,IAAI,UAAU,CAAC,MAAM,CAAC,EAAE,EAAE,CAAC,CAAA;YACzD,OAAO,SAAS,CAAA;QACpB,CAAC;IACL,CAAC;SAAM,CAAC;QACJ,2BAA2B;QAC3B,MAAM,YAAY,GAAG,IAAI,WAAW,CAAC,EAAE,CAAC,CAAA;QACxC,MAAM,IAAI,GAAG,IAAI,QAAQ,CAAC,YAAY,CAAC,CAAA;QACvC,WAAW,CAAC,IAAI,CAAC,CAAA;QACjB,OAAO,YAAY,CAAA;IACvB,CAAC;AACL,CAAC,CAAA;AA/EY,QAAA,cAAc,kBA+E1B","sourcesContent":["// packages/audio-studio/src/utils/writeWavHeader.ts\n\n/**\n * Options for creating a WAV header.\n */\nexport interface WavHeaderOptions {\n /** Optional buffer containing audio data. If provided, it will be combined with the header. */\n buffer?: ArrayBuffer\n /** The sample rate of the audio in Hz (e.g., 44100). */\n sampleRate: number\n /** The number of audio channels (e.g., 1 for mono, 2 for stereo). */\n numChannels: number\n /** The bit depth of the audio (e.g., 16, 24, or 32). */\n bitDepth: number\n /** Whether the audio data is in float format (only applies to 32-bit) */\n isFloat?: boolean\n}\n\n/**\n * Writes or updates a WAV (RIFF) header based on the provided options.\n *\n * This function can be used in three ways:\n * 1. To create a standalone WAV header (when no buffer is provided).\n * 2. To create a WAV header and combine it with existing audio data (when a buffer without a header is provided).\n * 3. To update an existing WAV header in the provided buffer.\n *\n * For streaming audio where the final size is unknown, this function sets the size fields\n * to the maximum 32-bit value (0xFFFFFFFF). These can be updated later using the\n * `updateWavHeaderSize` function once the final size is known.\n *\n * @param options - The options for creating or updating the WAV header.\n * @returns An ArrayBuffer containing the WAV header, or the header combined with the provided audio data.\n *\n * @throws {Error} Throws an error if the provided options are invalid or if the buffer is too small.\n */\nexport const writeWavHeader = ({\n buffer,\n sampleRate,\n numChannels,\n bitDepth,\n isFloat = bitDepth === 32, // Default to float for 32-bit\n}: WavHeaderOptions): ArrayBuffer => {\n // For 32-bit float, we use format 3, otherwise format 1 for PCM\n const audioFormat = isFloat ? 3 : 1 // 3 = IEEE float, 1 = PCM\n\n const bytesPerSample = bitDepth / 8\n const blockAlign = numChannels * bytesPerSample\n const byteRate = sampleRate * blockAlign\n\n // Function to write a string to the DataView\n const writeString = (view: DataView, offset: number, string: string) => {\n for (let i = 0; i < string.length; i++) {\n view.setUint8(offset + i, string.charCodeAt(i))\n }\n }\n\n // Function to write or update the header\n const writeHeader = (view: DataView, dataSize: number = 0xffffffff) => {\n // RIFF chunk descriptor\n writeString(view, 0, 'RIFF') // ChunkID\n view.setUint32(4, 36 + dataSize, true) // ChunkSize: 4 + (8 + 16) + (8 + dataSize)\n writeString(view, 8, 'WAVE') // Format\n\n // \"fmt \" sub-chunk\n writeString(view, 12, 'fmt ') // Subchunk1ID\n view.setUint32(16, 16, true) // Subchunk1Size (16 for PCM/Float)\n view.setUint16(20, audioFormat, true) // AudioFormat (3 for float, 1 for PCM)\n view.setUint16(22, numChannels, true) // NumChannels\n view.setUint32(24, sampleRate, true) // SampleRate\n view.setUint32(28, byteRate, true) // ByteRate = SampleRate * NumChannels * BitsPerSample/8\n view.setUint16(32, blockAlign, true) // BlockAlign = NumChannels * BitsPerSample/8\n view.setUint16(34, bitDepth, true) // BitsPerSample\n\n // \"data\" sub-chunk\n writeString(view, 36, 'data') // Subchunk2ID\n view.setUint32(40, dataSize, true) // Subchunk2Size = NumSamples * NumChannels * BitsPerSample/8\n }\n\n if (buffer) {\n // Handle existing buffer\n\n // Check for minimum size\n if (buffer.byteLength < 44) {\n throw new Error('Buffer is too small to contain a valid WAV header')\n }\n\n const view = new DataView(buffer)\n\n // Check if the buffer already has a WAV header by looking for \"RIFF\" at the start\n const existingHeader = view.getUint32(0, false) === 0x52494646 // \"RIFF\" in ASCII\n\n if (existingHeader) {\n // Update the existing header\n writeHeader(view, buffer.byteLength - 44)\n return buffer\n } else {\n // Create a new buffer with header + data\n const newBuffer = new ArrayBuffer(44 + buffer.byteLength)\n const newView = new DataView(newBuffer)\n\n // Write header to new buffer\n writeHeader(newView, buffer.byteLength)\n\n // Copy audio data after header\n new Uint8Array(newBuffer).set(new Uint8Array(buffer), 44)\n return newBuffer\n }\n } else {\n // Create standalone header\n const headerBuffer = new ArrayBuffer(44)\n const view = new DataView(headerBuffer)\n writeHeader(view)\n return headerBuffer\n }\n}\n"]}
|
|
@@ -0,0 +1,294 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
// packages/audio-studio/src/workers/InlineFeaturesExtractor.web.tsx
|
|
3
|
+
//
|
|
4
|
+
// The worker blob is assembled at runtime by concatenating:
|
|
5
|
+
// 1. The WASM glue JS string (defines createMelSpectrogramModule)
|
|
6
|
+
// 2. This inline worker code
|
|
7
|
+
//
|
|
8
|
+
// This keeps ONE C++ implementation for spectral/MFCC/chroma across all platforms.
|
|
9
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
10
|
+
exports.InlineFeaturesExtractor = void 0;
|
|
11
|
+
exports.InlineFeaturesExtractor = `
|
|
12
|
+
// --- Constants ---
|
|
13
|
+
const N_FFT = 1024;
|
|
14
|
+
const N_CHROMA = 12;
|
|
15
|
+
const STRUCT_SIZE = 32; // CAudioFeaturesResult
|
|
16
|
+
|
|
17
|
+
// --- WASM module state ---
|
|
18
|
+
let wasmModule = null;
|
|
19
|
+
let wasmInitPromise = null;
|
|
20
|
+
let wasmFramePtr = 0;
|
|
21
|
+
let wasmFrameCapacity = 0;
|
|
22
|
+
let wasmResultPtr = 0;
|
|
23
|
+
|
|
24
|
+
function initWasm(sampleRate) {
|
|
25
|
+
if (wasmInitPromise) return wasmInitPromise;
|
|
26
|
+
wasmInitPromise = (typeof createMelSpectrogramModule === 'function'
|
|
27
|
+
? createMelSpectrogramModule()
|
|
28
|
+
: Promise.reject(new Error('WASM glue not loaded'))
|
|
29
|
+
).then(function(Module) {
|
|
30
|
+
wasmModule = Module;
|
|
31
|
+
Module._audio_features_init(sampleRate, N_FFT, 13, 26, 1, 1);
|
|
32
|
+
wasmResultPtr = Module._malloc(STRUCT_SIZE);
|
|
33
|
+
Module.HEAPU8.fill(0, wasmResultPtr, wasmResultPtr + STRUCT_SIZE);
|
|
34
|
+
return Module;
|
|
35
|
+
}).catch(function(err) {
|
|
36
|
+
wasmInitPromise = null;
|
|
37
|
+
throw err;
|
|
38
|
+
});
|
|
39
|
+
return wasmInitPromise;
|
|
40
|
+
}
|
|
41
|
+
|
|
42
|
+
function readWasmResult(Module, ptr) {
|
|
43
|
+
var getValue = Module.getValue;
|
|
44
|
+
var centroid = getValue(ptr, 'float');
|
|
45
|
+
var flatness = getValue(ptr + 4, 'float');
|
|
46
|
+
var rolloff = getValue(ptr + 8, 'float');
|
|
47
|
+
var bandwidth = getValue(ptr + 12, 'float');
|
|
48
|
+
var mfccPtr = getValue(ptr + 16, 'i32');
|
|
49
|
+
var mfccCount = getValue(ptr + 20, 'i32');
|
|
50
|
+
var chromaPtr = getValue(ptr + 24, 'i32');
|
|
51
|
+
var chromaCount = getValue(ptr + 28, 'i32');
|
|
52
|
+
|
|
53
|
+
var mfcc = [];
|
|
54
|
+
if (mfccPtr && mfccCount > 0) {
|
|
55
|
+
var off = mfccPtr >> 2;
|
|
56
|
+
for (var i = 0; i < mfccCount; i++) mfcc.push(Module.HEAPF32[off + i]);
|
|
57
|
+
}
|
|
58
|
+
var chromagram = [];
|
|
59
|
+
if (chromaPtr && chromaCount > 0) {
|
|
60
|
+
var off2 = chromaPtr >> 2;
|
|
61
|
+
for (var i = 0; i < chromaCount; i++) chromagram.push(Module.HEAPF32[off2 + i]);
|
|
62
|
+
}
|
|
63
|
+
return { centroid: centroid, flatness: flatness, rolloff: rolloff, bandwidth: bandwidth, mfcc: mfcc, chromagram: chromagram };
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
// Compute spectral/MFCC/chroma features for a segment via WASM C++
|
|
67
|
+
function computeFeaturesWasm(segment, sampleRate, featureOptions) {
|
|
68
|
+
if (!wasmModule || !wasmResultPtr) {
|
|
69
|
+
return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };
|
|
70
|
+
}
|
|
71
|
+
var Module = wasmModule;
|
|
72
|
+
var needSpectral = featureOptions.spectralCentroid || featureOptions.spectralFlatness ||
|
|
73
|
+
featureOptions.spectralRolloff || featureOptions.spectralBandwidth;
|
|
74
|
+
var needMfcc = !!featureOptions.mfcc;
|
|
75
|
+
var needChroma = !!featureOptions.chromagram;
|
|
76
|
+
|
|
77
|
+
if (!needSpectral && !needMfcc && !needChroma) {
|
|
78
|
+
return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };
|
|
79
|
+
}
|
|
80
|
+
|
|
81
|
+
// Re-init if needed (different feature flags)
|
|
82
|
+
Module._audio_features_init(sampleRate, N_FFT, 13, 26, needMfcc ? 1 : 0, needChroma ? 1 : 0);
|
|
83
|
+
|
|
84
|
+
// Allocate/grow input buffer on WASM heap
|
|
85
|
+
if (segment.length > wasmFrameCapacity) {
|
|
86
|
+
if (wasmFramePtr) Module._free(wasmFramePtr);
|
|
87
|
+
wasmFramePtr = Module._malloc(segment.length * 4);
|
|
88
|
+
wasmFrameCapacity = segment.length;
|
|
89
|
+
}
|
|
90
|
+
Module.HEAPF32.set(segment, wasmFramePtr >> 2);
|
|
91
|
+
|
|
92
|
+
var ok = Module._audio_features_compute_frame(wasmFramePtr, segment.length, wasmResultPtr);
|
|
93
|
+
if (!ok) {
|
|
94
|
+
return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };
|
|
95
|
+
}
|
|
96
|
+
var result = readWasmResult(Module, wasmResultPtr);
|
|
97
|
+
Module._audio_features_free_arrays(wasmResultPtr);
|
|
98
|
+
return result;
|
|
99
|
+
}
|
|
100
|
+
|
|
101
|
+
// --- JS fallback for HNR (autocorrelation, no FFT needed) ---
|
|
102
|
+
function extractHNR(segmentData) {
|
|
103
|
+
var frameSize = segmentData.length;
|
|
104
|
+
var autocorrelation = new Float32Array(frameSize);
|
|
105
|
+
for (var i = 0; i < frameSize; i++) {
|
|
106
|
+
var sum = 0;
|
|
107
|
+
for (var j = 0; j < frameSize - i; j++) {
|
|
108
|
+
sum += segmentData[j] * segmentData[j + i];
|
|
109
|
+
}
|
|
110
|
+
autocorrelation[i] = sum;
|
|
111
|
+
}
|
|
112
|
+
var maxAutocorrelation = -Infinity;
|
|
113
|
+
for (var i = 1; i < autocorrelation.length; i++) {
|
|
114
|
+
if (autocorrelation[i] > maxAutocorrelation) {
|
|
115
|
+
maxAutocorrelation = autocorrelation[i];
|
|
116
|
+
}
|
|
117
|
+
}
|
|
118
|
+
return autocorrelation[0] !== 0
|
|
119
|
+
? 10 * Math.log10(maxAutocorrelation / (autocorrelation[0] - maxAutocorrelation))
|
|
120
|
+
: 0;
|
|
121
|
+
}
|
|
122
|
+
|
|
123
|
+
// --- JS fallback for pitch estimation (simple peak-picking) ---
|
|
124
|
+
function estimatePitch(segment, sampleRate) {
|
|
125
|
+
if (!segment || segment.length < 2 || !sampleRate) return 0;
|
|
126
|
+
// Simple autocorrelation-based pitch
|
|
127
|
+
var minLag = Math.floor(sampleRate / 1000); // 1000 Hz max
|
|
128
|
+
var maxLag = Math.floor(sampleRate / 50); // 50 Hz min
|
|
129
|
+
if (maxLag >= segment.length) maxLag = segment.length - 1;
|
|
130
|
+
var bestCorr = -Infinity;
|
|
131
|
+
var bestLag = 0;
|
|
132
|
+
for (var lag = minLag; lag <= maxLag; lag++) {
|
|
133
|
+
var corr = 0;
|
|
134
|
+
for (var i = 0; i < segment.length - lag; i++) {
|
|
135
|
+
corr += segment[i] * segment[i + lag];
|
|
136
|
+
}
|
|
137
|
+
if (corr > bestCorr) {
|
|
138
|
+
bestCorr = corr;
|
|
139
|
+
bestLag = lag;
|
|
140
|
+
}
|
|
141
|
+
}
|
|
142
|
+
return bestLag > 0 ? sampleRate / bestLag : 0;
|
|
143
|
+
}
|
|
144
|
+
|
|
145
|
+
// --- Unique ID counter ---
|
|
146
|
+
let uniqueIdCounter = 0;
|
|
147
|
+
|
|
148
|
+
// --- Message handler ---
|
|
149
|
+
self.onmessage = function (event) {
|
|
150
|
+
var enableLogging = event.data.enableLogging || false;
|
|
151
|
+
|
|
152
|
+
// Reset command
|
|
153
|
+
if (event.data.command === 'resetCounter') {
|
|
154
|
+
var newValue = event.data.value;
|
|
155
|
+
uniqueIdCounter = typeof newValue === 'number' ? newValue : 0;
|
|
156
|
+
return;
|
|
157
|
+
}
|
|
158
|
+
|
|
159
|
+
var channelData = event.data.channelData;
|
|
160
|
+
var sampleRate = event.data.sampleRate;
|
|
161
|
+
var segmentDurationMs = event.data.segmentDurationMs;
|
|
162
|
+
var bitDepth = event.data.bitDepth;
|
|
163
|
+
var fullAudioDurationMs = event.data.fullAudioDurationMs;
|
|
164
|
+
var numberOfChannels = event.data.numberOfChannels;
|
|
165
|
+
var _features = event.data.features;
|
|
166
|
+
var features = _features || {};
|
|
167
|
+
var bytesPerSample = bitDepth / 8;
|
|
168
|
+
|
|
169
|
+
var subChunkStartTime = (typeof fullAudioDurationMs === 'number' && !isNaN(fullAudioDurationMs) && fullAudioDurationMs >= 0)
|
|
170
|
+
? fullAudioDurationMs / 1000 : 0;
|
|
171
|
+
|
|
172
|
+
// Check if any C++-backed features are requested
|
|
173
|
+
var needWasm = features.spectralCentroid || features.spectralFlatness ||
|
|
174
|
+
features.spectralRolloff || features.spectralBandwidth ||
|
|
175
|
+
features.mfcc || features.chromagram;
|
|
176
|
+
|
|
177
|
+
function createFeaturesObject(maxAmp, rms, sumSquares, zeroCrossings, segLen, wasmResult, startIdx, endIdx) {
|
|
178
|
+
if (!Object.values(features).some(function(v) { return v; })) return undefined;
|
|
179
|
+
var result = {};
|
|
180
|
+
if (features.energy) result.energy = sumSquares;
|
|
181
|
+
if (features.rms) result.rms = rms;
|
|
182
|
+
result.minAmplitude = -maxAmp;
|
|
183
|
+
result.maxAmplitude = maxAmp;
|
|
184
|
+
if (features.zcr) result.zcr = zeroCrossings / segLen;
|
|
185
|
+
if (features.spectralCentroid) result.spectralCentroid = wasmResult.centroid;
|
|
186
|
+
if (features.spectralFlatness) result.spectralFlatness = wasmResult.flatness;
|
|
187
|
+
if (features.spectralRolloff) result.spectralRolloff = wasmResult.rolloff;
|
|
188
|
+
if (features.spectralBandwidth) result.spectralBandwidth = wasmResult.bandwidth;
|
|
189
|
+
if (features.mfcc) result.mfcc = wasmResult.mfcc;
|
|
190
|
+
if (features.chromagram) result.chromagram = wasmResult.chromagram;
|
|
191
|
+
if (features.hnr) result.hnr = extractHNR(channelData.slice(startIdx, endIdx));
|
|
192
|
+
if (features.pitch) result.pitch = estimatePitch(channelData.slice(startIdx, endIdx), sampleRate);
|
|
193
|
+
return result;
|
|
194
|
+
}
|
|
195
|
+
|
|
196
|
+
function processSegment(startIdx, endIdx, segLen) {
|
|
197
|
+
var sumSquares = 0, maxAmp = 0, zeroCrossings = 0;
|
|
198
|
+
for (var j = startIdx; j < endIdx; j++) {
|
|
199
|
+
var value = channelData[j];
|
|
200
|
+
sumSquares += value * value;
|
|
201
|
+
if (Math.abs(value) > maxAmp) maxAmp = Math.abs(value);
|
|
202
|
+
if (j > 0 && value * channelData[j - 1] < 0) zeroCrossings++;
|
|
203
|
+
}
|
|
204
|
+
var rms = Math.sqrt(sumSquares / segLen);
|
|
205
|
+
var wasmResult = needWasm
|
|
206
|
+
? computeFeaturesWasm(channelData.slice(startIdx, endIdx), sampleRate, features)
|
|
207
|
+
: { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };
|
|
208
|
+
|
|
209
|
+
var dataPoint = {
|
|
210
|
+
id: uniqueIdCounter++,
|
|
211
|
+
amplitude: maxAmp,
|
|
212
|
+
rms: rms,
|
|
213
|
+
startTime: subChunkStartTime + (startIdx / sampleRate),
|
|
214
|
+
endTime: subChunkStartTime + (endIdx / sampleRate),
|
|
215
|
+
dB: 20 * Math.log10(rms + 1e-6),
|
|
216
|
+
silent: rms < 0.01,
|
|
217
|
+
startPosition: startIdx * (numberOfChannels || 1) * bytesPerSample,
|
|
218
|
+
endPosition: endIdx * (numberOfChannels || 1) * bytesPerSample,
|
|
219
|
+
samples: segLen,
|
|
220
|
+
};
|
|
221
|
+
var ef = createFeaturesObject(maxAmp, rms, sumSquares, zeroCrossings, segLen, wasmResult, startIdx, endIdx);
|
|
222
|
+
if (ef) dataPoint.features = ef;
|
|
223
|
+
return dataPoint;
|
|
224
|
+
}
|
|
225
|
+
|
|
226
|
+
function extractWaveform() {
|
|
227
|
+
var totalSamples = channelData.length;
|
|
228
|
+
var durationMs = (totalSamples / sampleRate) * 1000;
|
|
229
|
+
var samplesPerSegment = Math.floor(sampleRate * (segmentDurationMs / 1000));
|
|
230
|
+
var numPoints = Math.floor(totalSamples / samplesPerSegment);
|
|
231
|
+
var remainingSamples = totalSamples % samplesPerSegment;
|
|
232
|
+
|
|
233
|
+
var min = Infinity, max = -Infinity;
|
|
234
|
+
for (var i = 0; i < totalSamples; i++) {
|
|
235
|
+
if (channelData[i] < min) min = channelData[i];
|
|
236
|
+
if (channelData[i] > max) max = channelData[i];
|
|
237
|
+
}
|
|
238
|
+
|
|
239
|
+
var dataPoints = [];
|
|
240
|
+
for (var i = 0; i < numPoints; i++) {
|
|
241
|
+
var startIdx = i * samplesPerSegment;
|
|
242
|
+
dataPoints.push(processSegment(startIdx, startIdx + samplesPerSegment, samplesPerSegment));
|
|
243
|
+
}
|
|
244
|
+
if (remainingSamples > samplesPerSegment / 4) {
|
|
245
|
+
var startIdx = numPoints * samplesPerSegment;
|
|
246
|
+
dataPoints.push(processSegment(startIdx, totalSamples, totalSamples - startIdx));
|
|
247
|
+
}
|
|
248
|
+
return {
|
|
249
|
+
durationMs: durationMs,
|
|
250
|
+
dataPoints: dataPoints,
|
|
251
|
+
amplitudeRange: { min: min, max: max },
|
|
252
|
+
rmsRange: { min: 0, max: Math.max(Math.abs(min), Math.abs(max)) }
|
|
253
|
+
};
|
|
254
|
+
}
|
|
255
|
+
|
|
256
|
+
// Main: init WASM if needed, then process
|
|
257
|
+
var doProcess = function() {
|
|
258
|
+
try {
|
|
259
|
+
var t0 = performance.now();
|
|
260
|
+
var result = extractWaveform();
|
|
261
|
+
var t1 = performance.now();
|
|
262
|
+
self.postMessage({
|
|
263
|
+
command: 'features',
|
|
264
|
+
result: {
|
|
265
|
+
bitDepth: bitDepth,
|
|
266
|
+
samples: channelData.length,
|
|
267
|
+
numberOfChannels: numberOfChannels,
|
|
268
|
+
sampleRate: sampleRate,
|
|
269
|
+
segmentDurationMs: segmentDurationMs,
|
|
270
|
+
durationMs: result.durationMs,
|
|
271
|
+
dataPoints: result.dataPoints,
|
|
272
|
+
amplitudeRange: result.amplitudeRange,
|
|
273
|
+
rmsRange: result.rmsRange,
|
|
274
|
+
extractionTimeMs: t1 - t0,
|
|
275
|
+
}
|
|
276
|
+
});
|
|
277
|
+
} catch (error) {
|
|
278
|
+
console.error('[Worker] Error', { message: error.message, stack: error.stack });
|
|
279
|
+
self.postMessage({ error: { message: error.message, stack: error.stack, name: error.name } });
|
|
280
|
+
}
|
|
281
|
+
};
|
|
282
|
+
|
|
283
|
+
if (needWasm && !wasmModule) {
|
|
284
|
+
initWasm(sampleRate).then(doProcess).catch(function(e) {
|
|
285
|
+
console.error('[Worker] WASM init failed, processing without WASM:', e);
|
|
286
|
+
needWasm = false;
|
|
287
|
+
doProcess();
|
|
288
|
+
});
|
|
289
|
+
} else {
|
|
290
|
+
doProcess();
|
|
291
|
+
}
|
|
292
|
+
};
|
|
293
|
+
`;
|
|
294
|
+
//# sourceMappingURL=InlineFeaturesExtractor.web.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"InlineFeaturesExtractor.web.js","sourceRoot":"","sources":["../../../src/workers/InlineFeaturesExtractor.web.tsx"],"names":[],"mappings":";AAAA,oEAAoE;AACpE,EAAE;AACF,4DAA4D;AAC5D,oEAAoE;AACpE,+BAA+B;AAC/B,EAAE;AACF,mFAAmF;;;AAEtE,QAAA,uBAAuB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CA0RtC,CAAA","sourcesContent":["// packages/audio-studio/src/workers/InlineFeaturesExtractor.web.tsx\n//\n// The worker blob is assembled at runtime by concatenating:\n// 1. The WASM glue JS string (defines createMelSpectrogramModule)\n// 2. This inline worker code\n//\n// This keeps ONE C++ implementation for spectral/MFCC/chroma across all platforms.\n\nexport const InlineFeaturesExtractor = `\n// --- Constants ---\nconst N_FFT = 1024;\nconst N_CHROMA = 12;\nconst STRUCT_SIZE = 32; // CAudioFeaturesResult\n\n// --- WASM module state ---\nlet wasmModule = null;\nlet wasmInitPromise = null;\nlet wasmFramePtr = 0;\nlet wasmFrameCapacity = 0;\nlet wasmResultPtr = 0;\n\nfunction initWasm(sampleRate) {\n if (wasmInitPromise) return wasmInitPromise;\n wasmInitPromise = (typeof createMelSpectrogramModule === 'function'\n ? createMelSpectrogramModule()\n : Promise.reject(new Error('WASM glue not loaded'))\n ).then(function(Module) {\n wasmModule = Module;\n Module._audio_features_init(sampleRate, N_FFT, 13, 26, 1, 1);\n wasmResultPtr = Module._malloc(STRUCT_SIZE);\n Module.HEAPU8.fill(0, wasmResultPtr, wasmResultPtr + STRUCT_SIZE);\n return Module;\n }).catch(function(err) {\n wasmInitPromise = null;\n throw err;\n });\n return wasmInitPromise;\n}\n\nfunction readWasmResult(Module, ptr) {\n var getValue = Module.getValue;\n var centroid = getValue(ptr, 'float');\n var flatness = getValue(ptr + 4, 'float');\n var rolloff = getValue(ptr + 8, 'float');\n var bandwidth = getValue(ptr + 12, 'float');\n var mfccPtr = getValue(ptr + 16, 'i32');\n var mfccCount = getValue(ptr + 20, 'i32');\n var chromaPtr = getValue(ptr + 24, 'i32');\n var chromaCount = getValue(ptr + 28, 'i32');\n\n var mfcc = [];\n if (mfccPtr && mfccCount > 0) {\n var off = mfccPtr >> 2;\n for (var i = 0; i < mfccCount; i++) mfcc.push(Module.HEAPF32[off + i]);\n }\n var chromagram = [];\n if (chromaPtr && chromaCount > 0) {\n var off2 = chromaPtr >> 2;\n for (var i = 0; i < chromaCount; i++) chromagram.push(Module.HEAPF32[off2 + i]);\n }\n return { centroid: centroid, flatness: flatness, rolloff: rolloff, bandwidth: bandwidth, mfcc: mfcc, chromagram: chromagram };\n}\n\n// Compute spectral/MFCC/chroma features for a segment via WASM C++\nfunction computeFeaturesWasm(segment, sampleRate, featureOptions) {\n if (!wasmModule || !wasmResultPtr) {\n return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };\n }\n var Module = wasmModule;\n var needSpectral = featureOptions.spectralCentroid || featureOptions.spectralFlatness ||\n featureOptions.spectralRolloff || featureOptions.spectralBandwidth;\n var needMfcc = !!featureOptions.mfcc;\n var needChroma = !!featureOptions.chromagram;\n\n if (!needSpectral && !needMfcc && !needChroma) {\n return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };\n }\n\n // Re-init if needed (different feature flags)\n Module._audio_features_init(sampleRate, N_FFT, 13, 26, needMfcc ? 1 : 0, needChroma ? 1 : 0);\n\n // Allocate/grow input buffer on WASM heap\n if (segment.length > wasmFrameCapacity) {\n if (wasmFramePtr) Module._free(wasmFramePtr);\n wasmFramePtr = Module._malloc(segment.length * 4);\n wasmFrameCapacity = segment.length;\n }\n Module.HEAPF32.set(segment, wasmFramePtr >> 2);\n\n var ok = Module._audio_features_compute_frame(wasmFramePtr, segment.length, wasmResultPtr);\n if (!ok) {\n return { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };\n }\n var result = readWasmResult(Module, wasmResultPtr);\n Module._audio_features_free_arrays(wasmResultPtr);\n return result;\n}\n\n// --- JS fallback for HNR (autocorrelation, no FFT needed) ---\nfunction extractHNR(segmentData) {\n var frameSize = segmentData.length;\n var autocorrelation = new Float32Array(frameSize);\n for (var i = 0; i < frameSize; i++) {\n var sum = 0;\n for (var j = 0; j < frameSize - i; j++) {\n sum += segmentData[j] * segmentData[j + i];\n }\n autocorrelation[i] = sum;\n }\n var maxAutocorrelation = -Infinity;\n for (var i = 1; i < autocorrelation.length; i++) {\n if (autocorrelation[i] > maxAutocorrelation) {\n maxAutocorrelation = autocorrelation[i];\n }\n }\n return autocorrelation[0] !== 0\n ? 10 * Math.log10(maxAutocorrelation / (autocorrelation[0] - maxAutocorrelation))\n : 0;\n}\n\n// --- JS fallback for pitch estimation (simple peak-picking) ---\nfunction estimatePitch(segment, sampleRate) {\n if (!segment || segment.length < 2 || !sampleRate) return 0;\n // Simple autocorrelation-based pitch\n var minLag = Math.floor(sampleRate / 1000); // 1000 Hz max\n var maxLag = Math.floor(sampleRate / 50); // 50 Hz min\n if (maxLag >= segment.length) maxLag = segment.length - 1;\n var bestCorr = -Infinity;\n var bestLag = 0;\n for (var lag = minLag; lag <= maxLag; lag++) {\n var corr = 0;\n for (var i = 0; i < segment.length - lag; i++) {\n corr += segment[i] * segment[i + lag];\n }\n if (corr > bestCorr) {\n bestCorr = corr;\n bestLag = lag;\n }\n }\n return bestLag > 0 ? sampleRate / bestLag : 0;\n}\n\n// --- Unique ID counter ---\nlet uniqueIdCounter = 0;\n\n// --- Message handler ---\nself.onmessage = function (event) {\n var enableLogging = event.data.enableLogging || false;\n\n // Reset command\n if (event.data.command === 'resetCounter') {\n var newValue = event.data.value;\n uniqueIdCounter = typeof newValue === 'number' ? newValue : 0;\n return;\n }\n\n var channelData = event.data.channelData;\n var sampleRate = event.data.sampleRate;\n var segmentDurationMs = event.data.segmentDurationMs;\n var bitDepth = event.data.bitDepth;\n var fullAudioDurationMs = event.data.fullAudioDurationMs;\n var numberOfChannels = event.data.numberOfChannels;\n var _features = event.data.features;\n var features = _features || {};\n var bytesPerSample = bitDepth / 8;\n\n var subChunkStartTime = (typeof fullAudioDurationMs === 'number' && !isNaN(fullAudioDurationMs) && fullAudioDurationMs >= 0)\n ? fullAudioDurationMs / 1000 : 0;\n\n // Check if any C++-backed features are requested\n var needWasm = features.spectralCentroid || features.spectralFlatness ||\n features.spectralRolloff || features.spectralBandwidth ||\n features.mfcc || features.chromagram;\n\n function createFeaturesObject(maxAmp, rms, sumSquares, zeroCrossings, segLen, wasmResult, startIdx, endIdx) {\n if (!Object.values(features).some(function(v) { return v; })) return undefined;\n var result = {};\n if (features.energy) result.energy = sumSquares;\n if (features.rms) result.rms = rms;\n result.minAmplitude = -maxAmp;\n result.maxAmplitude = maxAmp;\n if (features.zcr) result.zcr = zeroCrossings / segLen;\n if (features.spectralCentroid) result.spectralCentroid = wasmResult.centroid;\n if (features.spectralFlatness) result.spectralFlatness = wasmResult.flatness;\n if (features.spectralRolloff) result.spectralRolloff = wasmResult.rolloff;\n if (features.spectralBandwidth) result.spectralBandwidth = wasmResult.bandwidth;\n if (features.mfcc) result.mfcc = wasmResult.mfcc;\n if (features.chromagram) result.chromagram = wasmResult.chromagram;\n if (features.hnr) result.hnr = extractHNR(channelData.slice(startIdx, endIdx));\n if (features.pitch) result.pitch = estimatePitch(channelData.slice(startIdx, endIdx), sampleRate);\n return result;\n }\n\n function processSegment(startIdx, endIdx, segLen) {\n var sumSquares = 0, maxAmp = 0, zeroCrossings = 0;\n for (var j = startIdx; j < endIdx; j++) {\n var value = channelData[j];\n sumSquares += value * value;\n if (Math.abs(value) > maxAmp) maxAmp = Math.abs(value);\n if (j > 0 && value * channelData[j - 1] < 0) zeroCrossings++;\n }\n var rms = Math.sqrt(sumSquares / segLen);\n var wasmResult = needWasm\n ? computeFeaturesWasm(channelData.slice(startIdx, endIdx), sampleRate, features)\n : { centroid: 0, flatness: 0, rolloff: 0, bandwidth: 0, mfcc: [], chromagram: [] };\n\n var dataPoint = {\n id: uniqueIdCounter++,\n amplitude: maxAmp,\n rms: rms,\n startTime: subChunkStartTime + (startIdx / sampleRate),\n endTime: subChunkStartTime + (endIdx / sampleRate),\n dB: 20 * Math.log10(rms + 1e-6),\n silent: rms < 0.01,\n startPosition: startIdx * (numberOfChannels || 1) * bytesPerSample,\n endPosition: endIdx * (numberOfChannels || 1) * bytesPerSample,\n samples: segLen,\n };\n var ef = createFeaturesObject(maxAmp, rms, sumSquares, zeroCrossings, segLen, wasmResult, startIdx, endIdx);\n if (ef) dataPoint.features = ef;\n return dataPoint;\n }\n\n function extractWaveform() {\n var totalSamples = channelData.length;\n var durationMs = (totalSamples / sampleRate) * 1000;\n var samplesPerSegment = Math.floor(sampleRate * (segmentDurationMs / 1000));\n var numPoints = Math.floor(totalSamples / samplesPerSegment);\n var remainingSamples = totalSamples % samplesPerSegment;\n\n var min = Infinity, max = -Infinity;\n for (var i = 0; i < totalSamples; i++) {\n if (channelData[i] < min) min = channelData[i];\n if (channelData[i] > max) max = channelData[i];\n }\n\n var dataPoints = [];\n for (var i = 0; i < numPoints; i++) {\n var startIdx = i * samplesPerSegment;\n dataPoints.push(processSegment(startIdx, startIdx + samplesPerSegment, samplesPerSegment));\n }\n if (remainingSamples > samplesPerSegment / 4) {\n var startIdx = numPoints * samplesPerSegment;\n dataPoints.push(processSegment(startIdx, totalSamples, totalSamples - startIdx));\n }\n return {\n durationMs: durationMs,\n dataPoints: dataPoints,\n amplitudeRange: { min: min, max: max },\n rmsRange: { min: 0, max: Math.max(Math.abs(min), Math.abs(max)) }\n };\n }\n\n // Main: init WASM if needed, then process\n var doProcess = function() {\n try {\n var t0 = performance.now();\n var result = extractWaveform();\n var t1 = performance.now();\n self.postMessage({\n command: 'features',\n result: {\n bitDepth: bitDepth,\n samples: channelData.length,\n numberOfChannels: numberOfChannels,\n sampleRate: sampleRate,\n segmentDurationMs: segmentDurationMs,\n durationMs: result.durationMs,\n dataPoints: result.dataPoints,\n amplitudeRange: result.amplitudeRange,\n rmsRange: result.rmsRange,\n extractionTimeMs: t1 - t0,\n }\n });\n } catch (error) {\n console.error('[Worker] Error', { message: error.message, stack: error.stack });\n self.postMessage({ error: { message: error.message, stack: error.stack, name: error.name } });\n }\n };\n\n if (needWasm && !wasmModule) {\n initWasm(sampleRate).then(doProcess).catch(function(e) {\n console.error('[Worker] WASM init failed, processing without WASM:', e);\n needWasm = false;\n doProcess();\n });\n } else {\n doProcess();\n }\n};\n`\n"]}
|