@siteed/expo-audio-stream 2.0.1 → 2.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (166)
  1. package/README.md +46 -27
  2. package/build/index.d.ts +11 -12
  3. package/build/index.js +44 -10
  4. package/package.json +49 -110
  5. package/src/index.ts +18 -33
  6. package/CHANGELOG.md +0 -195
  7. package/android/build.gradle +0 -105
  8. package/android/src/main/AndroidManifest.xml +0 -27
  9. package/android/src/main/java/net/siteed/audiostream/AudioAnalysisData.kt +0 -166
  10. package/android/src/main/java/net/siteed/audiostream/AudioDataEncoder.kt +0 -9
  11. package/android/src/main/java/net/siteed/audiostream/AudioFileHandler.kt +0 -131
  12. package/android/src/main/java/net/siteed/audiostream/AudioFormatUtils.kt +0 -103
  13. package/android/src/main/java/net/siteed/audiostream/AudioNotificationsManager.kt +0 -435
  14. package/android/src/main/java/net/siteed/audiostream/AudioProcessor.kt +0 -1936
  15. package/android/src/main/java/net/siteed/audiostream/AudioRecorderManager.kt +0 -1437
  16. package/android/src/main/java/net/siteed/audiostream/AudioRecordingService.kt +0 -138
  17. package/android/src/main/java/net/siteed/audiostream/Constants.kt +0 -20
  18. package/android/src/main/java/net/siteed/audiostream/EventSender.kt +0 -7
  19. package/android/src/main/java/net/siteed/audiostream/ExpoAudioStreamModule.kt +0 -509
  20. package/android/src/main/java/net/siteed/audiostream/FFT.kt +0 -99
  21. package/android/src/main/java/net/siteed/audiostream/Features.kt +0 -98
  22. package/android/src/main/java/net/siteed/audiostream/NotificationConfig.kt +0 -70
  23. package/android/src/main/java/net/siteed/audiostream/PermissionUtils.kt +0 -59
  24. package/android/src/main/java/net/siteed/audiostream/RecordingActionReceiver.kt +0 -59
  25. package/android/src/main/java/net/siteed/audiostream/RecordingConfig.kt +0 -205
  26. package/android/src/main/java/net/siteed/audiostream/WaveformConfig.kt +0 -19
  27. package/android/src/main/java/net/siteed/audiostream/WaveformRenderer.kt +0 -159
  28. package/android/src/main/res/drawable/ic_default_action_icon.xml +0 -16
  29. package/android/src/main/res/drawable/ic_microphone.xml +0 -13
  30. package/android/src/main/res/drawable/ic_pause.xml +0 -10
  31. package/android/src/main/res/drawable/ic_play.xml +0 -10
  32. package/android/src/main/res/drawable/ic_stop.xml +0 -10
  33. package/android/src/main/res/layout/notification_recording.xml +0 -37
  34. package/android/src/main/test/java/net/siteed/audiostream/AudioProcessorTest.kt +0 -56
  35. package/app.plugin.js +0 -1
  36. package/build/AudioAnalysis/AudioAnalysis.types.d.ts +0 -144
  37. package/build/AudioAnalysis/AudioAnalysis.types.d.ts.map +0 -1
  38. package/build/AudioAnalysis/AudioAnalysis.types.js +0 -3
  39. package/build/AudioAnalysis/AudioAnalysis.types.js.map +0 -1
  40. package/build/AudioAnalysis/extractAudioAnalysis.d.ts +0 -78
  41. package/build/AudioAnalysis/extractAudioAnalysis.d.ts.map +0 -1
  42. package/build/AudioAnalysis/extractAudioAnalysis.js +0 -229
  43. package/build/AudioAnalysis/extractAudioAnalysis.js.map +0 -1
  44. package/build/AudioAnalysis/extractWaveform.d.ts +0 -8
  45. package/build/AudioAnalysis/extractWaveform.d.ts.map +0 -1
  46. package/build/AudioAnalysis/extractWaveform.js +0 -11
  47. package/build/AudioAnalysis/extractWaveform.js.map +0 -1
  48. package/build/AudioRecorder.provider.d.ts +0 -11
  49. package/build/AudioRecorder.provider.d.ts.map +0 -1
  50. package/build/AudioRecorder.provider.js +0 -37
  51. package/build/AudioRecorder.provider.js.map +0 -1
  52. package/build/ExpoAudioStream.native.d.ts +0 -3
  53. package/build/ExpoAudioStream.native.d.ts.map +0 -1
  54. package/build/ExpoAudioStream.native.js +0 -6
  55. package/build/ExpoAudioStream.native.js.map +0 -1
  56. package/build/ExpoAudioStream.types.d.ts +0 -206
  57. package/build/ExpoAudioStream.types.d.ts.map +0 -1
  58. package/build/ExpoAudioStream.types.js +0 -2
  59. package/build/ExpoAudioStream.types.js.map +0 -1
  60. package/build/ExpoAudioStream.web.d.ts +0 -59
  61. package/build/ExpoAudioStream.web.d.ts.map +0 -1
  62. package/build/ExpoAudioStream.web.js +0 -285
  63. package/build/ExpoAudioStream.web.js.map +0 -1
  64. package/build/ExpoAudioStreamModule.d.ts +0 -3
  65. package/build/ExpoAudioStreamModule.d.ts.map +0 -1
  66. package/build/ExpoAudioStreamModule.js +0 -239
  67. package/build/ExpoAudioStreamModule.js.map +0 -1
  68. package/build/WebRecorder.web.d.ts +0 -119
  69. package/build/WebRecorder.web.d.ts.map +0 -1
  70. package/build/WebRecorder.web.js +0 -436
  71. package/build/WebRecorder.web.js.map +0 -1
  72. package/build/constants.d.ts +0 -11
  73. package/build/constants.d.ts.map +0 -1
  74. package/build/constants.js +0 -14
  75. package/build/constants.js.map +0 -1
  76. package/build/events.d.ts +0 -26
  77. package/build/events.d.ts.map +0 -1
  78. package/build/events.js +0 -21
  79. package/build/events.js.map +0 -1
  80. package/build/index.d.ts.map +0 -1
  81. package/build/index.js.map +0 -1
  82. package/build/useAudioRecorder.d.ts +0 -21
  83. package/build/useAudioRecorder.d.ts.map +0 -1
  84. package/build/useAudioRecorder.js +0 -427
  85. package/build/useAudioRecorder.js.map +0 -1
  86. package/build/utils/BlobFix.d.ts +0 -9
  87. package/build/utils/BlobFix.d.ts.map +0 -1
  88. package/build/utils/BlobFix.js +0 -498
  89. package/build/utils/BlobFix.js.map +0 -1
  90. package/build/utils/audioProcessing.d.ts +0 -24
  91. package/build/utils/audioProcessing.d.ts.map +0 -1
  92. package/build/utils/audioProcessing.js +0 -133
  93. package/build/utils/audioProcessing.js.map +0 -1
  94. package/build/utils/concatenateBuffers.d.ts +0 -8
  95. package/build/utils/concatenateBuffers.d.ts.map +0 -1
  96. package/build/utils/concatenateBuffers.js +0 -21
  97. package/build/utils/concatenateBuffers.js.map +0 -1
  98. package/build/utils/convertPCMToFloat32.d.ts +0 -13
  99. package/build/utils/convertPCMToFloat32.d.ts.map +0 -1
  100. package/build/utils/convertPCMToFloat32.js +0 -120
  101. package/build/utils/convertPCMToFloat32.js.map +0 -1
  102. package/build/utils/encodingToBitDepth.d.ts +0 -5
  103. package/build/utils/encodingToBitDepth.d.ts.map +0 -1
  104. package/build/utils/encodingToBitDepth.js +0 -13
  105. package/build/utils/encodingToBitDepth.js.map +0 -1
  106. package/build/utils/getWavFileInfo.d.ts +0 -26
  107. package/build/utils/getWavFileInfo.d.ts.map +0 -1
  108. package/build/utils/getWavFileInfo.js +0 -92
  109. package/build/utils/getWavFileInfo.js.map +0 -1
  110. package/build/utils/writeWavHeader.d.ts +0 -49
  111. package/build/utils/writeWavHeader.d.ts.map +0 -1
  112. package/build/utils/writeWavHeader.js +0 -91
  113. package/build/utils/writeWavHeader.js.map +0 -1
  114. package/build/workers/InlineFeaturesExtractor.web.d.ts +0 -2
  115. package/build/workers/InlineFeaturesExtractor.web.d.ts.map +0 -1
  116. package/build/workers/InlineFeaturesExtractor.web.js +0 -828
  117. package/build/workers/InlineFeaturesExtractor.web.js.map +0 -1
  118. package/build/workers/inlineAudioWebWorker.web.d.ts +0 -2
  119. package/build/workers/inlineAudioWebWorker.web.d.ts.map +0 -1
  120. package/build/workers/inlineAudioWebWorker.web.js +0 -157
  121. package/build/workers/inlineAudioWebWorker.web.js.map +0 -1
  122. package/expo-module.config.json +0 -9
  123. package/ios/AudioAnalysisData.swift +0 -74
  124. package/ios/AudioNotificationManager.swift +0 -135
  125. package/ios/AudioProcessingHelpers.swift +0 -743
  126. package/ios/AudioProcessor.swift +0 -858
  127. package/ios/AudioStreamError.swift +0 -7
  128. package/ios/AudioStreamManager.swift +0 -1708
  129. package/ios/AudioStreamManagerDelegate.swift +0 -16
  130. package/ios/DataPoint.swift +0 -54
  131. package/ios/DecodingConfig.swift +0 -47
  132. package/ios/ExpoAudioStream.podspec +0 -27
  133. package/ios/ExpoAudioStreamModule.swift +0 -698
  134. package/ios/FFT.swift +0 -62
  135. package/ios/Features.swift +0 -95
  136. package/ios/Logger.swift +0 -7
  137. package/ios/NotificationExtension.swift +0 -15
  138. package/ios/RecordingResult.swift +0 -22
  139. package/ios/RecordingSettings.swift +0 -265
  140. package/ios/WaveformExtractor.swift +0 -105
  141. package/plugin/build/index.d.ts +0 -21
  142. package/plugin/build/index.js +0 -191
  143. package/plugin/src/index.ts +0 -278
  144. package/plugin/tsconfig.json +0 -10
  145. package/plugin/tsconfig.tsbuildinfo +0 -1
  146. package/src/AudioAnalysis/AudioAnalysis.types.ts +0 -165
  147. package/src/AudioAnalysis/extractAudioAnalysis.ts +0 -370
  148. package/src/AudioAnalysis/extractWaveform.ts +0 -22
  149. package/src/AudioRecorder.provider.tsx +0 -54
  150. package/src/ExpoAudioStream.native.ts +0 -6
  151. package/src/ExpoAudioStream.types.ts +0 -329
  152. package/src/ExpoAudioStream.web.ts +0 -359
  153. package/src/ExpoAudioStreamModule.ts +0 -286
  154. package/src/WebRecorder.web.ts +0 -580
  155. package/src/constants.ts +0 -18
  156. package/src/events.ts +0 -60
  157. package/src/useAudioRecorder.tsx +0 -620
  158. package/src/utils/BlobFix.ts +0 -559
  159. package/src/utils/audioProcessing.ts +0 -205
  160. package/src/utils/concatenateBuffers.ts +0 -24
  161. package/src/utils/convertPCMToFloat32.ts +0 -170
  162. package/src/utils/encodingToBitDepth.ts +0 -18
  163. package/src/utils/getWavFileInfo.ts +0 -132
  164. package/src/utils/writeWavHeader.ts +0 -114
  165. package/src/workers/InlineFeaturesExtractor.web.tsx +0 -827
  166. package/src/workers/inlineAudioWebWorker.web.tsx +0 -156
@@ -1,828 +0,0 @@
1
- // packages/expo-audio-stream/src/workers/InlineFeaturesExtractor.web.tsx
2
- export const InlineFeaturesExtractor = `
3
- // Constants
4
- const N_FFT = 1024; // Default FFT size
5
- const MAX_FFT_SIZE = 8192; // Maximum FFT size to prevent memory issues
6
- const N_CHROMA = 12;
7
-
8
- // FFT Implementation with normalized Hann window
9
- function FFT(n) {
10
- this.n = n;
11
- this.cosTable = new Float32Array(n / 2);
12
- this.sinTable = new Float32Array(n / 2);
13
- this.hannWindow = new Float32Array(n);
14
-
15
- // Match Android implementation with precomputed tables
16
- const normalizationFactor = Math.sqrt(2.0 / n);
17
- for (var i = 0; i < n / 2; i++) {
18
- this.cosTable[i] = Math.cos(2.0 * Math.PI * i / n);
19
- this.sinTable[i] = Math.sin(2.0 * Math.PI * i / n);
20
- }
21
-
22
- // Precompute normalized Hann window to match Android
23
- for (var i = 0; i < n; i++) {
24
- this.hannWindow[i] = normalizationFactor * 0.5 * (1 - Math.cos(2.0 * Math.PI * i / (n - 1)));
25
- }
26
- }
27
-
28
- FFT.prototype.transform = function(data) {
29
- const n = data.length;
30
-
31
- // Validate input length is power of 2
32
- if ((n & (n - 1)) !== 0) {
33
- throw new Error('FFT length must be power of 2');
34
- }
35
-
36
- // Use iterative bit reversal instead of recursive
37
- const bitReversedIndices = new Uint32Array(n);
38
- for (let i = 0; i < n; i++) {
39
- let reversed = 0;
40
- let j = i;
41
- let bits = Math.log2(n);
42
- while (bits--) {
43
- reversed = (reversed << 1) | (j & 1);
44
- j >>= 1;
45
- }
46
- bitReversedIndices[i] = reversed;
47
- }
48
-
49
- // Apply bit reversal
50
- for (let i = 0; i < n; i++) {
51
- const j = bitReversedIndices[i];
52
- if (i < j) {
53
- const temp = data[i];
54
- data[i] = data[j];
55
- data[j] = temp;
56
- }
57
- }
58
-
59
- // Iterative FFT computation with optimized memory usage
60
- for (let step = 1; step < n; step <<= 1) {
61
- const jump = step << 1;
62
- const angleStep = Math.PI / step;
63
-
64
- for (let group = 0; group < n; group += jump) {
65
- for (let pair = group; pair < group + step; pair++) {
66
- const match = pair + step;
67
- const angle = angleStep * (pair - group);
68
-
69
- const currentCos = Math.cos(angle);
70
- const currentSin = Math.sin(angle);
71
-
72
- const real = currentCos * data[match] - currentSin * data[match + 1];
73
- const imag = currentCos * data[match + 1] + currentSin * data[match];
74
-
75
- data[match] = data[pair] - real;
76
- data[match + 1] = data[pair + 1] - imag;
77
- data[pair] += real;
78
- data[pair + 1] += imag;
79
- }
80
- }
81
- }
82
- };
83
-
84
- // Add realInverse method
85
- FFT.prototype.realInverse = function(powerSpectrum, output) {
86
- const n = powerSpectrum.length;
87
- const complexData = new Float32Array(n * 2);
88
-
89
- // Copy power spectrum to complex format
90
- for (let i = 0; i < n/2 + 1; i++) {
91
- complexData[2 * i] = powerSpectrum[i];
92
- if (2 * i + 1 < complexData.length) {
93
- complexData[2 * i + 1] = 0;
94
- }
95
- }
96
-
97
- // Conjugate for inverse FFT
98
- for (let i = 0; i < n; i++) {
99
- if (2 * i + 1 < complexData.length) {
100
- complexData[2 * i + 1] = -complexData[2 * i + 1];
101
- }
102
- }
103
-
104
- this.transform(complexData);
105
-
106
- // Copy real part to output and scale
107
- for (let i = 0; i < n; i++) {
108
- output[i] = complexData[2 * i] / n;
109
- }
110
- };
111
-
112
- // Add helper functions to match Android
113
- function nextPowerOfTwo(n) {
114
- let value = 1;
115
- while (value < n) {
116
- value *= 2;
117
- }
118
- return value;
119
- }
120
-
121
- function applyHannWindow(samples) {
122
- const output = new Float32Array(samples.length);
123
- for (let i = 0; i < samples.length; i++) {
124
- const multiplier = 0.5 * (1 - Math.cos(2 * Math.PI * i / (samples.length - 1)));
125
- output[i] = samples[i] * multiplier;
126
- }
127
- return output;
128
- }
129
-
130
- // Update spectral feature computation to match Android
131
- function computeSpectralFeatures(segment, sampleRate, featureOptions = {}) {
132
- try {
133
- // Early return if no spectral features are requested
134
- if (!featureOptions.spectralCentroid &&
135
- !featureOptions.spectralFlatness &&
136
- !featureOptions.spectralRollOff &&
137
- !featureOptions.spectralBandwidth &&
138
- !featureOptions.magnitudeSpectrum) {
139
- return {
140
- centroid: 0,
141
- flatness: 0,
142
- rollOff: 0,
143
- bandwidth: 0,
144
- magnitudeSpectrum: []
145
- };
146
- }
147
-
148
- // Ensure we have valid data
149
- if (!segment || segment.length === 0) {
150
- throw new Error('Invalid segment data');
151
- }
152
-
153
- // Process in fixed-size chunks
154
- const chunkSize = N_FFT;
155
- const numChunks = Math.ceil(segment.length / chunkSize);
156
-
157
- let results = {
158
- centroid: 0,
159
- flatness: 0,
160
- rollOff: 0,
161
- bandwidth: 0,
162
- magnitudeSpectrum: new Float32Array(N_FFT / 2 + 1).fill(0)
163
- };
164
-
165
- let validChunks = 0;
166
-
167
- // Iterate through chunks
168
- for (let i = 0; i < numChunks; i++) {
169
- const start = i * chunkSize;
170
- const end = Math.min(start + chunkSize, segment.length);
171
- const chunk = segment.slice(start, end);
172
-
173
- if (chunk.length < N_FFT / 4) continue; // Skip very small chunks
174
-
175
- // Process the chunk
176
- const paddedChunk = new Float32Array(N_FFT);
177
- paddedChunk.set(applyHannWindow(chunk));
178
-
179
- const fft = new FFT(N_FFT);
180
- fft.transform(paddedChunk);
181
-
182
- // Calculate magnitude spectrum
183
- const chunkMagnitudeSpectrum = new Float32Array(N_FFT / 2 + 1);
184
- let hasSignal = false;
185
-
186
- for (let j = 0; j < N_FFT / 2; j++) {
187
- const re = paddedChunk[2 * j];
188
- const im = paddedChunk[2 * j + 1];
189
- const magnitude = Math.sqrt(re * re + im * im);
190
- chunkMagnitudeSpectrum[j] = magnitude;
191
- if (magnitude > Number.EPSILON) hasSignal = true;
192
- }
193
-
194
- if (!hasSignal) continue;
195
- validChunks++;
196
-
197
- // Accumulate results
198
- if (featureOptions.spectralCentroid) {
199
- const centroid = computeSpectralCentroid(chunkMagnitudeSpectrum, sampleRate);
200
- if (!isNaN(centroid)) results.centroid += centroid;
201
- }
202
-
203
- if (featureOptions.spectralFlatness) {
204
- const flatness = computeSpectralFlatness(chunkMagnitudeSpectrum);
205
- if (!isNaN(flatness)) results.flatness += flatness;
206
- }
207
-
208
- if (featureOptions.spectralRollOff) {
209
- const rolloff = computeSpectralRollOff(chunkMagnitudeSpectrum, sampleRate);
210
- if (!isNaN(rolloff)) results.rollOff += rolloff;
211
- }
212
-
213
- if (featureOptions.spectralBandwidth && !isNaN(results.centroid)) {
214
- const bandwidth = computeSpectralBandwidth(chunkMagnitudeSpectrum, sampleRate, results.centroid);
215
- if (!isNaN(bandwidth)) results.bandwidth += bandwidth;
216
- }
217
-
218
- if (featureOptions.magnitudeSpectrum) {
219
- for (let j = 0; j < results.magnitudeSpectrum.length; j++) {
220
- results.magnitudeSpectrum[j] += chunkMagnitudeSpectrum[j];
221
- }
222
- }
223
- }
224
-
225
- // Average the accumulated results
226
- if (validChunks > 0) {
227
- results.centroid /= validChunks;
228
- results.flatness /= validChunks;
229
- results.rollOff /= validChunks;
230
- results.bandwidth /= validChunks;
231
-
232
- if (featureOptions.magnitudeSpectrum) {
233
- for (let i = 0; i < results.magnitudeSpectrum.length; i++) {
234
- results.magnitudeSpectrum[i] /= validChunks;
235
- }
236
- }
237
- }
238
-
239
- return results;
240
- } catch (error) {
241
- console.error('[Worker] Spectral feature computation error:', error);
242
- return {
243
- centroid: 0,
244
- flatness: 0,
245
- rollOff: 0,
246
- bandwidth: 0,
247
- magnitudeSpectrum: []
248
- };
249
- }
250
- }
251
-
252
- function computeSpectralCentroid(magnitudeSpectrum, sampleRate) {
253
- const sum = magnitudeSpectrum.reduce((a, b) => a + (b || 0), 0);
254
- if (sum <= Number.EPSILON) return 0;
255
-
256
- const weightedSum = magnitudeSpectrum.reduce((acc, value, index) =>
257
- acc + (index * (sampleRate / N_FFT) * (value || 0)), 0);
258
-
259
- return weightedSum / sum;
260
- }
261
-
262
- function computeSpectralFlatness(powerSpectrum) {
263
- // Add small epsilon to avoid log(0)
264
- const epsilon = Number.EPSILON;
265
- const validSpectrum = powerSpectrum.map(v => Math.max(v, epsilon));
266
-
267
- const geometricMean = Math.exp(
268
- validSpectrum
269
- .map(v => Math.log(v))
270
- .reduce((a, b) => a + b) / validSpectrum.length
271
- );
272
-
273
- const arithmeticMean =
274
- validSpectrum.reduce((a, b) => a + b) / validSpectrum.length;
275
-
276
- return geometricMean / arithmeticMean;
277
- }
278
-
279
- function computeSpectralRollOff(magnitudeSpectrum, sampleRate) {
280
- const totalEnergy = magnitudeSpectrum.reduce((a, b) => a + b, 0);
281
- const rollOffThreshold = totalEnergy * 0.85;
282
- let cumulativeEnergy = 0;
283
-
284
- for (let i = 0; i < magnitudeSpectrum.length; i++) {
285
- cumulativeEnergy += magnitudeSpectrum[i];
286
- if (cumulativeEnergy >= rollOffThreshold) {
287
- return (i / magnitudeSpectrum.length) * (sampleRate / 2);
288
- }
289
- }
290
-
291
- return 0;
292
- }
293
-
294
- function computeSpectralBandwidth(magnitudeSpectrum, sampleRate, centroid) {
295
- const sum = magnitudeSpectrum.reduce((a, b) => a + (b || 0), 0);
296
- if (sum <= Number.EPSILON) return 0;
297
-
298
- const weightedSum = magnitudeSpectrum.reduce(
299
- (acc, value, index) => {
300
- const freq = index * sampleRate / (2 * magnitudeSpectrum.length);
301
- return acc + (value || 0) * Math.pow(freq - centroid, 2);
302
- }, 0
303
- );
304
-
305
- return Math.sqrt(weightedSum / sum);
306
- }
307
-
308
- function computeChroma(segmentData, sampleRate) {
309
- // Ensure we have valid input data
310
- if (!segmentData || segmentData.length === 0) {
311
- return new Array(N_CHROMA).fill(0);
312
- }
313
-
314
- const fftLength = nextPowerOfTwo(Math.max(segmentData.length, N_FFT));
315
- const windowed = applyHannWindow(segmentData);
316
- const padded = new Float32Array(fftLength);
317
- padded.set(windowed.slice(0, Math.min(windowed.length, fftLength)));
318
-
319
- const fft = new FFT(fftLength);
320
- try {
321
- fft.transform(padded);
322
- } catch (e) {
323
- console.error('[Worker] FFT transform failed in chromagram:', e);
324
- return new Array(N_CHROMA).fill(0);
325
- }
326
-
327
- const chroma = new Float32Array(N_CHROMA).fill(0);
328
- const freqsPerBin = sampleRate / fftLength;
329
- let totalEnergy = 0;
330
-
331
- // First pass: compute magnitudes and total energy
332
- for (let i = 0; i < fftLength / 2; i++) {
333
- const freq = i * freqsPerBin;
334
- if (freq > 20) { // Only consider frequencies above 20 Hz
335
- const re = padded[2 * i];
336
- const im = padded[2 * i + 1] || 0;
337
- const magnitude = Math.sqrt(re * re + im * im);
338
-
339
- if (magnitude > Number.EPSILON) {
340
- // Use a more stable pitch class calculation
341
- const midiNote = 69 + 12 * Math.log2(freq / 440.0);
342
- const pitchClass = Math.round(midiNote) % 12;
343
-
344
- if (pitchClass >= 0 && pitchClass < 12) {
345
- chroma[pitchClass] += magnitude;
346
- totalEnergy += magnitude;
347
- }
348
- }
349
- }
350
- }
351
-
352
- // Normalize chroma values only if we have energy
353
- if (totalEnergy > Number.EPSILON) {
354
- for (let i = 0; i < N_CHROMA; i++) {
355
- chroma[i] = chroma[i] / totalEnergy;
356
- }
357
- }
358
-
359
- // Convert to regular array and ensure no NaN values
360
- return Array.from(chroma, v => isNaN(v) ? 0 : v);
361
- }
362
-
363
- function extractHNR(segmentData) {
364
- const frameSize = segmentData.length;
365
- const autocorrelation = new Float32Array(frameSize);
366
-
367
- // Compute the autocorrelation iteratively
368
- for (let i = 0; i < frameSize; i++) {
369
- let sum = 0;
370
- for (let j = 0; j < frameSize - i; j++) {
371
- sum += segmentData[j] * segmentData[j + i];
372
- }
373
- autocorrelation[i] = sum;
374
- }
375
-
376
- // Find the maximum autocorrelation value iteratively
377
- let maxAutocorrelation = -Infinity;
378
- for (let i = 1; i < autocorrelation.length; i++) {
379
- if (autocorrelation[i] > maxAutocorrelation) {
380
- maxAutocorrelation = autocorrelation[i];
381
- }
382
- }
383
-
384
- // Compute the HNR
385
- return autocorrelation[0] !== 0
386
- ? 10 * Math.log10(maxAutocorrelation / (autocorrelation[0] - maxAutocorrelation))
387
- : 0;
388
- }
389
-
390
- function estimatePitch(segment, sampleRate) {
391
- // Early validation
392
- if (!segment || segment.length < 2 || !sampleRate) return 0;
393
-
394
- try {
395
- // Apply Hann window
396
- const windowed = applyHannWindow(segment);
397
-
398
- // Pad for FFT
399
- const fftLength = nextPowerOfTwo(segment.length * 2);
400
- const padded = new Float32Array(fftLength);
401
- padded.set(windowed);
402
-
403
- // Perform FFT
404
- const fft = new FFT(fftLength);
405
- fft.transform(padded);
406
-
407
- // Compute power spectrum
408
- const powerSpectrum = new Float32Array(fftLength / 2 + 1);
409
- for (let i = 0; i <= fftLength / 2; i++) {
410
- const re = padded[2 * i];
411
- const im = padded[2 * i + 1] || 0;
412
- powerSpectrum[i] = re * re + im * im;
413
- }
414
-
415
- // Find peak frequency
416
- let maxPower = 0;
417
- let peakIndex = 0;
418
- const minFreq = 50; // Minimum frequency to consider (Hz)
419
- const maxFreq = 1000; // Maximum frequency to consider (Hz)
420
- const minBin = Math.floor(minFreq * fftLength / sampleRate);
421
- const maxBin = Math.ceil(maxFreq * fftLength / sampleRate);
422
-
423
- for (let i = minBin; i <= maxBin; i++) {
424
- if (powerSpectrum[i] > maxPower) {
425
- maxPower = powerSpectrum[i];
426
- peakIndex = i;
427
- }
428
- }
429
-
430
- // Convert peak index to frequency
431
- const fundamentalFreq = peakIndex * sampleRate / fftLength;
432
-
433
- // Return 0 if the detected frequency is outside reasonable bounds
434
- return (fundamentalFreq >= minFreq && fundamentalFreq <= maxFreq) ?
435
- fundamentalFreq : 0;
436
-
437
- } catch (error) {
438
- console.error('[Worker] Pitch estimation error:', error);
439
- return 0;
440
- }
441
- }
442
-
443
- // Unique ID counter
444
- let uniqueIdCounter = 0
445
- let accumulatedDataPoints = []
446
- let lastEmitTime = Date.now()
447
-
448
- self.onmessage = function (event) {
449
- // Check if this is a reset command
450
- if (event.data.command === 'resetCounter') {
451
- uniqueIdCounter = event.data.startCounterFrom || 0;
452
- console.log('[Worker] Reset counter to', uniqueIdCounter);
453
- return; // Exit early, don't process audio
454
- }
455
-
456
- // Regular audio processing
457
- const {
458
- channelData,
459
- sampleRate,
460
- segmentDurationMs,
461
- algorithm,
462
- bitDepth,
463
- fullAudioDurationMs,
464
- numberOfChannels,
465
- features: _features,
466
- intervalAnalysis = 500,
467
- enableLogging,
468
- resetCounter,
469
- startCounterFrom,
470
- } = event.data
471
-
472
- // Also handle reset as part of regular message
473
- if (resetCounter) {
474
- uniqueIdCounter = startCounterFrom || 0;
475
- }
476
-
477
- const subChunkStartTime = fullAudioDurationMs / 1000
478
-
479
-
480
- // Create a simple logger that only logs when enabled
481
- const logger = enableLogging ? {
482
- debug: (...args) => console.debug('[Worker]', ...args),
483
- log: (...args) => console.log('[Worker]', ...args),
484
- error: (...args) => console.error('[Worker]', ...args)
485
- } : {
486
- debug: () => {},
487
- log: () => {},
488
- error: () => {}
489
- }
490
- console.log('[Worker] START Feature Extractor - hasData: ' + (event.data ? true : false) + ', channelData: ' + (event.data.channelData ? event.data.channelData.length : 0) + ', fullAudioDurationMs: ' + (event.data.fullAudioDurationMs || 0) + ', sampleRate: ' + (event.data.sampleRate || 0) + ', segmentDurationMs: ' + (event.data.segmentDurationMs || 0) + ', algorithm: ' + (event.data.algorithm || 'none') + ', bitDepth: ' + (event.data.bitDepth || 0) + ', numberOfChannels: ' + (event.data.numberOfChannels || 0) + ', features: ' + (event.data.features ? Object.keys(event.data.features).length : 0) + ', intervalAnalysis: ' + (event.data.intervalAnalysis || 0) + ', dataKeys: ' + (event.data ? Object.keys(event.data).join(',') : ''));
491
-
492
- const features = _features || {}
493
-
494
- const SILENCE_THRESHOLD = 0.01
495
- const MIN_SILENCE_DURATION = 1.5 * sampleRate // 1.5 seconds of silence
496
- const SPEECH_INERTIA_DURATION = 0.1 * sampleRate // Speech inertia duration in samples
497
- const RMS_THRESHOLD = 0.01
498
- const ZCR_THRESHOLD = 0.1
499
-
500
- // Placeholder functions for feature extraction
501
- const extractMFCC = (segmentData, sampleRate) => {
502
- // Implement MFCC extraction logic here
503
- return []
504
- }
505
-
506
- const extractSpectralCentroid = (segmentData, sampleRate) => {
507
- const magnitudeSpectrum = segmentData.map((v) => v * v)
508
- const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0)
509
- if (sum === 0) return 0
510
-
511
- const weightedSum = magnitudeSpectrum.reduce(
512
- (acc, value, index) => acc + index * value,
513
- 0
514
- )
515
- return (
516
- ((weightedSum / sum) * (sampleRate / 2)) / magnitudeSpectrum.length
517
- )
518
- }
519
-
520
- const extractSpectralFlatness = (segmentData) => {
521
- const magnitudeSpectrum = segmentData.map((v) => Math.abs(v))
522
- const geometricMean = Math.exp(
523
- magnitudeSpectrum
524
- .map((v) => Math.log(v + Number.MIN_VALUE))
525
- .reduce((a, b) => a + b) / magnitudeSpectrum.length
526
- )
527
- const arithmeticMean =
528
- magnitudeSpectrum.reduce((a, b) => a + b) / magnitudeSpectrum.length
529
- return arithmeticMean === 0 ? 0 : geometricMean / arithmeticMean
530
- }
531
-
532
- const extractSpectralRollOff = (segmentData, sampleRate) => {
533
- const magnitudeSpectrum = segmentData.map((v) => Math.abs(v))
534
- const totalEnergy = magnitudeSpectrum.reduce((a, b) => a + b, 0)
535
- const rollOffThreshold = totalEnergy * 0.85
536
- let cumulativeEnergy = 0
537
-
538
- for (let i = 0; i < magnitudeSpectrum.length; i++) {
539
- cumulativeEnergy += magnitudeSpectrum[i]
540
- if (cumulativeEnergy >= rollOffThreshold) {
541
- return (i / magnitudeSpectrum.length) * (sampleRate / 2)
542
- }
543
- }
544
-
545
- return 0
546
- }
547
-
548
- const extractSpectralBandwidth = (segmentData, sampleRate) => {
549
- const centroid = extractSpectralCentroid(segmentData, sampleRate)
550
- const magnitudeSpectrum = segmentData.map((v) => Math.abs(v))
551
- const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0)
552
- if (sum === 0) return 0
553
-
554
- const weightedSum = magnitudeSpectrum.reduce(
555
- (acc, value, index) => acc + value * Math.pow(index - centroid, 2),
556
- 0
557
- )
558
- return Math.sqrt(weightedSum / sum)
559
- }
560
-
561
- const extractChromagram = (segmentData, sampleRate) => {
562
- return [] // TODO implement
563
- }
564
-
565
- /**
566
- * Creates a features object based on requested features
567
- */
568
- function createFeaturesObject(
569
- features,
570
- maxAmp,
571
- rms,
572
- sumSquares,
573
- zeroCrossings,
574
- remainingSamples,
575
- spectralFeatures,
576
- channelData,
577
- startIdx,
578
- endIdx,
579
- sampleRate
580
- ) {
581
- // If no features are requested, return undefined
582
- if (!Object.values(features).some(function(v) { return v; })) {
583
- return undefined;
584
- }
585
-
586
- const result = {};
587
-
588
- if (features.energy) {
589
- result.energy = sumSquares;
590
- }
591
- if (features.rms) {
592
- result.rms = rms;
593
- }
594
- // Always include min/max amplitude if any features are requested
595
- result.minAmplitude = -maxAmp;
596
- result.maxAmplitude = maxAmp;
597
-
598
- if (features.zcr) {
599
- result.zcr = zeroCrossings / remainingSamples;
600
- }
601
- if (features.spectralCentroid) {
602
- result.spectralCentroid = spectralFeatures.centroid;
603
- }
604
- if (features.spectralFlatness) {
605
- result.spectralFlatness = spectralFeatures.flatness;
606
- }
607
- if (features.spectralRolloff) {
608
- result.spectralRolloff = spectralFeatures.rollOff;
609
- }
610
- if (features.spectralBandwidth) {
611
- result.spectralBandwidth = spectralFeatures.bandwidth;
612
- }
613
- if (features.chromagram) {
614
- result.chromagram = computeChroma(channelData.slice(startIdx, endIdx), sampleRate);
615
- }
616
- if (features.hnr) {
617
- result.hnr = extractHNR(channelData.slice(startIdx, endIdx));
618
- }
619
- if (features.pitch) {
620
- result.pitch = estimatePitch(channelData.slice(startIdx, endIdx), sampleRate);
621
- }
622
-
623
- return result;
624
- }
625
-
626
- function extractWaveform(
627
- channelData,
628
- sampleRate,
629
- segmentDurationMs
630
- ) {
631
- const logger = enableLogging ? {
632
- debug: (...args) => console.debug('[Worker]', ...args),
633
- log: (...args) => console.log('[Worker]', ...args),
634
- error: (...args) => console.error('[Worker]', ...args)
635
- } : {
636
- debug: () => {},
637
- log: () => {},
638
- error: () => {}
639
- }
640
-
641
- // Calculate amplitude range
642
- let min = Infinity
643
- let max = -Infinity
644
- for (let i = 0; i < channelData.length; i++) {
645
- min = Math.min(min, channelData[i])
646
- max = Math.max(max, channelData[i])
647
- }
648
-
649
- const totalSamples = channelData.length
650
- const durationMs = (totalSamples / sampleRate) * 1000
651
-
652
- // Calculate fixed segment sizes
653
- const samplesPerSegment = Math.floor(sampleRate * (segmentDurationMs / 1000));
654
- const numPoints = Math.floor(totalSamples / samplesPerSegment);
655
- const remainingSamples = totalSamples % samplesPerSegment;
656
-
657
- const dataPoints = []
658
-
659
- // Process full segments
660
- for (let i = 0; i < numPoints; i++) {
661
- const startIdx = i * samplesPerSegment
662
- const endIdx = startIdx + samplesPerSegment
663
-
664
- let sumSquares = 0
665
- let maxAmp = 0
666
- let zeroCrossings = 0
667
-
668
- // Calculate segment features
669
- for (let j = startIdx; j < endIdx; j++) {
670
- const value = channelData[j]
671
- sumSquares += value * value
672
- maxAmp = Math.max(maxAmp, Math.abs(value))
673
- if (j > 0 && value * channelData[j - 1] < 0) {
674
- zeroCrossings++
675
- }
676
- }
677
-
678
- const rms = Math.sqrt(sumSquares / samplesPerSegment)
679
- const startTime = subChunkStartTime + (startIdx / sampleRate)
680
- const endTime = subChunkStartTime + (endIdx / sampleRate)
681
-
682
- var spectralFeatures = computeSpectralFeatures(channelData.slice(startIdx, endIdx), sampleRate, features);
683
-
684
- const dataPoint = {
685
- id: uniqueIdCounter++,
686
- amplitude: maxAmp,
687
- rms,
688
- startTime,
689
- endTime,
690
- dB: 20 * Math.log10(rms + 1e-6),
691
- silent: rms < 0.01,
692
- startPosition: startIdx * 2,
693
- endPosition: endIdx * 2,
694
- samples: samplesPerSegment,
695
- }
696
-
697
- // Extract features if any are requested
698
- const extractedFeatures = createFeaturesObject(
699
- features,
700
- maxAmp,
701
- rms,
702
- sumSquares,
703
- zeroCrossings,
704
- samplesPerSegment,
705
- spectralFeatures,
706
- channelData,
707
- startIdx,
708
- endIdx,
709
- sampleRate
710
- );
711
-
712
- if (extractedFeatures) {
713
- dataPoint.features = extractedFeatures;
714
- }
715
-
716
- dataPoints.push(dataPoint)
717
- }
718
-
719
- // Handle remaining samples if they exist and are enough to process
720
- if (remainingSamples > samplesPerSegment / 4) { // Only process if we have at least 1/4 of a segment
721
- const startIdx = numPoints * samplesPerSegment
722
- const endIdx = totalSamples
723
-
724
- let sumSquares = 0
725
- let maxAmp = 0
726
- let zeroCrossings = 0
727
-
728
- for (let j = startIdx; j < endIdx; j++) {
729
- const value = channelData[j]
730
- sumSquares += value * value
731
- maxAmp = Math.max(maxAmp, Math.abs(value))
732
- if (j > 0 && value * channelData[j - 1] < 0) {
733
- zeroCrossings++
734
- }
735
- }
736
-
737
- const rms = Math.sqrt(sumSquares / remainingSamples)
738
- const startTime = startIdx / sampleRate;
739
- const endTime = endIdx / sampleRate;
740
-
741
- var spectralFeatures = computeSpectralFeatures(channelData.slice(startIdx, endIdx), sampleRate, features);
742
-
743
- const dataPoint = {
744
- id: uniqueIdCounter++,
745
- amplitude: maxAmp,
746
- rms,
747
- startTime,
748
- endTime,
749
- dB: 20 * Math.log10(rms + 1e-6),
750
- silent: rms < 0.01,
751
- startPosition: startIdx * 2,
752
- endPosition: endIdx * 2,
753
- samples: remainingSamples,
754
- }
755
-
756
- // Extract features if any are requested
757
- const extractedFeatures = createFeaturesObject(
758
- features,
759
- maxAmp,
760
- rms,
761
- sumSquares,
762
- zeroCrossings,
763
- remainingSamples,
764
- spectralFeatures,
765
- channelData,
766
- startIdx,
767
- endIdx,
768
- sampleRate
769
- );
770
-
771
- if (extractedFeatures) {
772
- dataPoint.features = extractedFeatures;
773
- }
774
-
775
- dataPoints.push(dataPoint)
776
- }
777
-
778
- return {
779
- durationMs,
780
- dataPoints,
781
- amplitudeRange: { min, max },
782
- rmsRange: {
783
- min: 0,
784
- max: Math.max(Math.abs(min), Math.abs(max))
785
- },
786
- extractionTimeMs: Date.now() - lastEmitTime
787
- }
788
- }
789
-
790
- try {
791
- const result = extractWaveform(
792
- channelData,
793
- sampleRate,
794
- segmentDurationMs
795
- )
796
-
797
- // Send complete result immediately
798
- self.postMessage({
799
- command: 'features',
800
- result: {
801
- bitDepth,
802
- samples: channelData.length,
803
- numberOfChannels,
804
- sampleRate,
805
- segmentDurationMs,
806
- durationMs: result.durationMs,
807
- dataPoints: result.dataPoints,
808
- amplitudeRange: result.amplitudeRange,
809
- rmsRange: result.rmsRange,
810
- }
811
- })
812
- } catch (error) {
813
- console.error('[Worker] Error', {
814
- message: error.message,
815
- stack: error.stack
816
- });
817
-
818
- self.postMessage({
819
- error: {
820
- message: error.message,
821
- stack: error.stack,
822
- name: error.name
823
- }
824
- });
825
- }
826
- }
827
- `;
828
- //# sourceMappingURL=InlineFeaturesExtractor.web.js.map