@siteed/expo-audio-stream 1.0.2 → 1.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.size-limit.json +6 -0
- package/README.md +18 -176
- package/android/src/main/java/net/siteed/audiostream/AudioRecorderManager.kt +1 -0
- package/app.plugin.js +1 -1
- package/build/AudioAnalysis/AudioAnalysis.types.d.ts +74 -0
- package/build/AudioAnalysis/AudioAnalysis.types.d.ts.map +1 -0
- package/build/AudioAnalysis/AudioAnalysis.types.js +3 -0
- package/build/AudioAnalysis/AudioAnalysis.types.js.map +1 -0
- package/build/AudioAnalysis/extractAudioAnalysis.d.ts +20 -0
- package/build/AudioAnalysis/extractAudioAnalysis.d.ts.map +1 -0
- package/build/AudioAnalysis/extractAudioAnalysis.js +88 -0
- package/build/AudioAnalysis/extractAudioAnalysis.js.map +1 -0
- package/build/AudioAnalysis/extractWaveform.d.ts +8 -0
- package/build/AudioAnalysis/extractWaveform.d.ts.map +1 -0
- package/build/AudioAnalysis/extractWaveform.js +14 -0
- package/build/AudioAnalysis/extractWaveform.js.map +1 -0
- package/build/AudioRecorder.provider.d.ts +15 -2
- package/build/AudioRecorder.provider.d.ts.map +1 -1
- package/build/AudioRecorder.provider.js +21 -8
- package/build/AudioRecorder.provider.js.map +1 -1
- package/build/ExpoAudioStream.native.d.ts.map +1 -1
- package/build/ExpoAudioStream.native.js +2 -2
- package/build/ExpoAudioStream.native.js.map +1 -1
- package/build/ExpoAudioStream.types.d.ts +33 -89
- package/build/ExpoAudioStream.types.d.ts.map +1 -1
- package/build/ExpoAudioStream.types.js.map +1 -1
- package/build/ExpoAudioStream.web.d.ts +10 -9
- package/build/ExpoAudioStream.web.d.ts.map +1 -1
- package/build/ExpoAudioStream.web.js +44 -25
- package/build/ExpoAudioStream.web.js.map +1 -1
- package/build/ExpoAudioStreamModule.d.ts.map +1 -1
- package/build/ExpoAudioStreamModule.js +13 -8
- package/build/ExpoAudioStreamModule.js.map +1 -1
- package/build/{WebRecorder.d.ts → WebRecorder.web.d.ts} +13 -9
- package/build/WebRecorder.web.d.ts.map +1 -0
- package/build/{WebRecorder.js → WebRecorder.web.js} +118 -63
- package/build/WebRecorder.web.js.map +1 -0
- package/build/constants.d.ts +11 -0
- package/build/constants.d.ts.map +1 -0
- package/build/constants.js +14 -0
- package/build/constants.js.map +1 -0
- package/build/events.d.ts +18 -0
- package/build/events.d.ts.map +1 -0
- package/build/events.js +15 -0
- package/build/events.js.map +1 -0
- package/build/index.d.ts +9 -17
- package/build/index.d.ts.map +1 -1
- package/build/index.js +7 -113
- package/build/index.js.map +1 -1
- package/build/logger.d.ts +9 -0
- package/build/logger.d.ts.map +1 -0
- package/build/logger.js +13 -0
- package/build/logger.js.map +1 -0
- package/build/useAudioRecorder.d.ts +20 -0
- package/build/useAudioRecorder.d.ts.map +1 -0
- package/build/{useAudioRecording.js → useAudioRecorder.js} +90 -86
- package/build/useAudioRecorder.js.map +1 -0
- package/build/utils/BlobFix.d.ts +9 -0
- package/build/utils/BlobFix.d.ts.map +1 -0
- package/build/utils/BlobFix.js +494 -0
- package/build/utils/BlobFix.js.map +1 -0
- package/build/utils/concatenateBuffers.d.ts +8 -0
- package/build/utils/concatenateBuffers.d.ts.map +1 -0
- package/build/utils/concatenateBuffers.js +21 -0
- package/build/utils/concatenateBuffers.js.map +1 -0
- package/build/utils/convertPCMToFloat32.d.ts +11 -0
- package/build/utils/convertPCMToFloat32.d.ts.map +1 -0
- package/build/utils/convertPCMToFloat32.js +54 -0
- package/build/utils/convertPCMToFloat32.js.map +1 -0
- package/build/utils/encodingToBitDepth.d.ts +5 -0
- package/build/utils/encodingToBitDepth.d.ts.map +1 -0
- package/build/utils/encodingToBitDepth.js +13 -0
- package/build/utils/encodingToBitDepth.js.map +1 -0
- package/build/utils/getWavFileInfo.d.ts +26 -0
- package/build/utils/getWavFileInfo.d.ts.map +1 -0
- package/build/utils/getWavFileInfo.js +92 -0
- package/build/utils/getWavFileInfo.js.map +1 -0
- package/build/utils/writeWavHeader.d.ts +9 -0
- package/build/utils/writeWavHeader.d.ts.map +1 -0
- package/build/utils/writeWavHeader.js +41 -0
- package/build/utils/writeWavHeader.js.map +1 -0
- package/build/workers/InlineFeaturesExtractor.web.d.ts +2 -0
- package/build/workers/InlineFeaturesExtractor.web.d.ts.map +1 -0
- package/build/workers/InlineFeaturesExtractor.web.js +303 -0
- package/build/workers/InlineFeaturesExtractor.web.js.map +1 -0
- package/build/workers/inlineAudioWebWorker.web.d.ts +2 -0
- package/build/workers/inlineAudioWebWorker.web.d.ts.map +1 -0
- package/build/workers/inlineAudioWebWorker.web.js +243 -0
- package/build/workers/inlineAudioWebWorker.web.js.map +1 -0
- package/expo-module.config.json +8 -17
- package/ios/AudioStreamManager.swift +40 -2
- package/ios/ExpoAudioStreamModule.swift +11 -0
- package/ios/RecordingResult.swift +1 -0
- package/package.json +72 -64
- package/plugin/build/index.d.ts +1 -1
- package/plugin/build/index.js +7 -7
- package/plugin/src/index.ts +47 -47
- package/plugin/tsconfig.json +8 -13
- package/publish.sh +0 -0
- package/src/AudioAnalysis/AudioAnalysis.types.ts +84 -0
- package/src/AudioAnalysis/extractAudioAnalysis.ts +147 -0
- package/src/AudioAnalysis/extractWaveform.ts +25 -0
- package/src/AudioRecorder.provider.tsx +59 -31
- package/src/ExpoAudioStream.native.ts +2 -2
- package/src/ExpoAudioStream.types.ts +58 -116
- package/src/ExpoAudioStream.web.ts +233 -205
- package/src/ExpoAudioStreamModule.ts +18 -12
- package/src/WebRecorder.web.ts +433 -0
- package/src/constants.ts +18 -0
- package/src/events.ts +39 -0
- package/src/index.ts +15 -176
- package/src/logger.ts +23 -0
- package/src/useAudioRecorder.tsx +420 -0
- package/src/utils/BlobFix.ts +550 -0
- package/src/utils/concatenateBuffers.ts +24 -0
- package/src/utils/convertPCMToFloat32.ts +75 -0
- package/src/utils/encodingToBitDepth.ts +18 -0
- package/src/utils/getWavFileInfo.ts +132 -0
- package/src/utils/writeWavHeader.ts +56 -0
- package/src/workers/InlineFeaturesExtractor.web.tsx +302 -0
- package/src/workers/inlineAudioWebWorker.web.tsx +242 -0
- package/tsconfig.json +12 -7
- package/build/WebRecorder.d.ts.map +0 -1
- package/build/WebRecorder.js.map +0 -1
- package/build/inlineAudioWebWorker.d.ts +0 -3
- package/build/inlineAudioWebWorker.d.ts.map +0 -1
- package/build/inlineAudioWebWorker.js +0 -340
- package/build/inlineAudioWebWorker.js.map +0 -1
- package/build/useAudioRecording.d.ts +0 -38
- package/build/useAudioRecording.d.ts.map +0 -1
- package/build/useAudioRecording.js.map +0 -1
- package/build/utils.d.ts +0 -31
- package/build/utils.d.ts.map +0 -1
- package/build/utils.js +0 -143
- package/build/utils.js.map +0 -1
- package/src/WebRecorder.ts +0 -364
- package/src/inlineAudioWebWorker.tsx +0 -340
- package/src/useAudioRecording.tsx +0 -410
- package/src/utils.ts +0 -189
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
/** Constant 44; presumably the canonical RIFF/WAVE header length in bytes — confirm against callers. */
export declare const WAV_HEADER_SIZE = 44;
/** Arguments accepted by {@link convertPCMToFloat32}. */
interface ConvertPCMToFloat32Options {
    /** Raw bytes to decode (optionally starting with a WAV header). */
    buffer: ArrayBuffer;
    /** Bits per sample; the implementation handles 8, 16, 24 and 32. */
    bitDepth: number;
    /** When true, the WAV header is parsed and decoding starts at the data chunk. Defaults to false. */
    skipWavHeader?: boolean;
}
/** Value resolved by {@link convertPCMToFloat32}. */
interface ConvertPCMToFloat32Result {
    /** Decoded samples, one float per input sample. */
    pcmValues: Float32Array;
    /** Smallest decoded sample value (0 when conversion fails). */
    min: number;
    /** Largest decoded sample value (0 when conversion fails). */
    max: number;
}
/**
 * Decodes little-endian PCM bytes into floats and reports the value range.
 * Errors are logged and turned into an empty result rather than rejected.
 */
export declare const convertPCMToFloat32: (options: ConvertPCMToFloat32Options) => Promise<ConvertPCMToFloat32Result>;
|
|
11
|
+
//# sourceMappingURL=convertPCMToFloat32.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"convertPCMToFloat32.d.ts","sourceRoot":"","sources":["../../src/utils/convertPCMToFloat32.ts"],"names":[],"mappings":"AAGA,eAAO,MAAM,eAAe,KAAK,CAAA;AA8BjC,eAAO,MAAM,mBAAmB,yCAI7B;IACC,MAAM,EAAE,WAAW,CAAA;IACnB,QAAQ,EAAE,MAAM,CAAA;IAChB,aAAa,CAAC,EAAE,OAAO,CAAA;CAC1B,KAAG,OAAO,CAAC;IAAE,SAAS,EAAE,YAAY,CAAC;IAAC,GAAG,EAAE,MAAM,CAAC;IAAC,GAAG,EAAE,MAAM,CAAA;CAAE,CAiChE,CAAA"}
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
import { getWavFileInfo } from './getWavFileInfo';
|
|
2
|
+
import { getLogger } from '../logger';
|
|
3
|
+
export const WAV_HEADER_SIZE = 44;
|
|
4
|
+
const logger = getLogger('convertPCMToFloat32');
|
|
5
|
+
/**
 * Decodes a single little-endian PCM sample into a float.
 *
 * @param {DataView} dataView - View over the raw sample bytes.
 * @param {number} offset - Byte offset of the sample inside `dataView`.
 * @param {number} bitDepth - Bits per sample: 8, 16, 24 or 32.
 * @returns {number} The sample scaled to roughly [-1, 1) for integer depths;
 *   32-bit samples are read as IEEE float and returned unchanged.
 * @throws {Error} When `bitDepth` is not one of the supported values.
 * @throws {RangeError} When the sample extends past the end of `dataView`.
 */
const convertSample = (dataView, offset, bitDepth) => {
    switch (bitDepth) {
        case 8:
            // 8-bit samples are read unsigned and re-centred on 128.
            return (dataView.getUint8(offset) - 128) / 128;
        case 16:
            return dataView.getInt16(offset, true) / 32768;
        case 24: {
            // DataView has no 24-bit accessor: assemble the three bytes by hand.
            const unsigned24 = dataView.getUint8(offset) |
                (dataView.getUint8(offset + 1) << 8) |
                (dataView.getUint8(offset + 2) << 16);
            // Sign-extend bit 23 so values >= 0x800000 become negative, then
            // scale by 2^23 exactly like the 16-bit branch scales by 2^15.
            const signed24 = (unsigned24 << 8) >> 8;
            return signed24 / 8388608;
        }
        case 32:
            return dataView.getFloat32(offset, true);
        default:
            throw new Error(`Unsupported bit depth: ${bitDepth}`);
    }
};
|
|
24
|
+
/**
 * Converts a buffer of little-endian PCM samples into a Float32Array and
 * tracks the smallest and largest decoded value.
 *
 * @param {object} options
 * @param {number} options.bitDepth - Bits per sample of the input.
 * @param {ArrayBuffer} options.buffer - Raw bytes to decode.
 * @param {boolean} [options.skipWavHeader=false] - When true, the buffer is
 *   parsed with `getWavFileInfo` and decoding starts at its `dataChunkOffset`.
 * @returns {Promise<{ pcmValues: Float32Array, min: number, max: number }>}
 *   Never rejects: any failure is logged and reported as an empty array with
 *   `min` and `max` set to 0.
 */
export const convertPCMToFloat32 = async ({ bitDepth, buffer, skipWavHeader = false, }) => {
    try {
        logger.debug(`Converting PCM to Float32: bitDepth: ${bitDepth}, buffer.byteLength: ${buffer.byteLength}`);
        const dataView = new DataView(buffer);
        let headerOffset = 0;
        if (skipWavHeader) {
            const wavFileInfo = await getWavFileInfo(buffer);
            headerOffset = wavFileInfo.dataChunkOffset;
        }
        const bytesPerSample = bitDepth / 8;
        const dataLength = buffer.byteLength - headerOffset;
        // Trailing bytes that do not make up a whole sample are ignored.
        const sampleLength = Math.floor(dataLength / bytesPerSample);
        const float32Array = new Float32Array(sampleLength);
        if (sampleLength === 0) {
            // Without samples there is no range; report 0/0 (same as the error
            // fallback) instead of leaking the Infinity/-Infinity sentinels.
            return { pcmValues: float32Array, min: 0, max: 0 };
        }
        let min = Infinity;
        let max = -Infinity;
        for (let i = 0; i < sampleLength; i++) {
            const offset = headerOffset + i * bytesPerSample;
            const value = convertSample(dataView, offset, bitDepth);
            if (value < min) {
                min = value;
            }
            if (value > max) {
                max = value;
            }
            float32Array[i] = value;
        }
        return { pcmValues: float32Array, min, max };
    }
    catch (error) {
        // Deliberate best-effort: callers receive an empty result, not a rejection.
        logger.error(`Error converting PCM to Float32`, error);
        return { pcmValues: new Float32Array(), min: 0, max: 0 };
    }
};
|
|
54
|
+
//# sourceMappingURL=convertPCMToFloat32.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"convertPCMToFloat32.js","sourceRoot":"","sources":["../../src/utils/convertPCMToFloat32.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAe,MAAM,kBAAkB,CAAA;AAC9D,OAAO,EAAE,SAAS,EAAE,MAAM,WAAW,CAAA;AAErC,MAAM,CAAC,MAAM,eAAe,GAAG,EAAE,CAAA;AAEjC,MAAM,MAAM,GAAG,SAAS,CAAC,qBAAqB,CAAC,CAAA;AAE/C,MAAM,aAAa,GAAG,CAClB,QAAkB,EAClB,MAAc,EACd,QAAgB,EACV,EAAE;IACR,QAAQ,QAAQ,EAAE,CAAC;QACf,KAAK,CAAC;YACF,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAC,MAAM,CAAC,GAAG,GAAG,CAAC,GAAG,GAAG,CAAA;QAClD,KAAK,EAAE;YACH,OAAO,QAAQ,CAAC,QAAQ,CAAC,MAAM,EAAE,IAAI,CAAC,GAAG,KAAK,CAAA;QAClD,KAAK,EAAE;YACH,OAAO,CACH,CAAC,CAAC,QAAQ,CAAC,QAAQ,CAAC,MAAM,CAAC;gBACvB,CAAC,QAAQ,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC;gBACpC,CAAC,QAAQ,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,IAAI,EAAE,CAAC,CAAC;gBACtC,OAAO,CAAC;gBACR,CAAC;gBACL,CAAC,CACJ,CAAA;QACL,KAAK,EAAE;YACH,OAAO,QAAQ,CAAC,UAAU,CAAC,MAAM,EAAE,IAAI,CAAC,CAAA;QAC5C;YACI,MAAM,IAAI,KAAK,CAAC,0BAA0B,QAAQ,EAAE,CAAC,CAAA;IAC7D,CAAC;AACL,CAAC,CAAA;AAED,MAAM,CAAC,MAAM,mBAAmB,GAAG,KAAK,EAAE,EACtC,QAAQ,EACR,MAAM,EACN,aAAa,GAAG,KAAK,GAKxB,EAAkE,EAAE;IACjE,IAAI,CAAC;QACD,MAAM,CAAC,KAAK,CACR,wCAAwC,QAAQ,wBAAwB,MAAM,CAAC,UAAU,EAAE,CAC9F,CAAA;QACD,MAAM,QAAQ,GAAG,IAAI,QAAQ,CAAC,MAAM,CAAC,CAAA;QACrC,IAAI,YAAY,GAAG,CAAC,CAAA;QACpB,IAAI,aAAa,EAAE,CAAC;YAChB,MAAM,WAAW,GAAgB,MAAM,cAAc,CAAC,MAAM,CAAC,CAAA;YAC7D,YAAY,GAAG,WAAW,CAAC,eAAe,CAAA;QAC9C,CAAC;QAED,MAAM,UAAU,GAAG,MAAM,CAAC,UAAU,GAAG,YAAY,CAAA;QACnD,MAAM,YAAY,GAAG,IAAI,CAAC,KAAK,CAAC,UAAU,GAAG,CAAC,QAAQ,GAAG,CAAC,CAAC,CAAC,CAAA;QAC5D,MAAM,YAAY,GAAG,IAAI,YAAY,CAAC,YAAY,CAAC,CAAA;QACnD,IAAI,GAAG,GAAG,QAAQ,CAAA;QAClB,IAAI,GAAG,GAAG,CAAC,QAAQ,CAAA;QAEnB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,YAAY,EAAE,CAAC,EAAE,EAAE,CAAC;YACpC,MAAM,MAAM,GAAG,YAAY,GAAG,CAAC,GAAG,CAAC,QAAQ,GAAG,CAAC,CAAC,CAAA;YAChD,MAAM,KAAK,GAAG,aAAa,CAAC,QAAQ,EAAE,MAAM,EAAE,QAAQ,CAAC,CAAA;YAEvD,IAAI,KAAK,GAAG,GAAG;gBAAE,GAAG,GAAG,KAAK,CAAA;YAC5B,IAAI,KAAK,GAAG,GAAG;gBAAE,GAAG,GAAG,KAAK,CAAA;YAE5B,YAAY,CAAC,CAAC,CAAC,GAAG,KAAK,CAAA;QAC3B,CA
AC;QAED,OAAO,EAAE,SAAS,EAAE,YAAY,EAAE,GAAG,EAAE,GAAG,EAAE,CAAA;IAChD,CAAC;IAAC,OAAO,KAAc,EAAE,CAAC;QACtB,MAAM,CAAC,KAAK,CAAC,iCAAiC,EAAE,KAAK,CAAC,CAAA;QACtD,OAAO,EAAE,SAAS,EAAE,IAAI,YAAY,EAAE,EAAE,GAAG,EAAE,CAAC,EAAE,GAAG,EAAE,CAAC,EAAE,CAAA;IAC5D,CAAC;AACL,CAAC,CAAA","sourcesContent":["import { getWavFileInfo, WavFileInfo } from './getWavFileInfo'\nimport { getLogger } from '../logger'\n\nexport const WAV_HEADER_SIZE = 44\n\nconst logger = getLogger('convertPCMToFloat32')\n\nconst convertSample = (\n dataView: DataView,\n offset: number,\n bitDepth: number\n): number => {\n switch (bitDepth) {\n case 8:\n return (dataView.getUint8(offset) - 128) / 128\n case 16:\n return dataView.getInt16(offset, true) / 32768\n case 24:\n return (\n ((dataView.getUint8(offset) |\n (dataView.getUint8(offset + 1) << 8) |\n (dataView.getUint8(offset + 2) << 16)) /\n 8388608) *\n 2 -\n 1\n )\n case 32:\n return dataView.getFloat32(offset, true)\n default:\n throw new Error(`Unsupported bit depth: ${bitDepth}`)\n }\n}\n\nexport const convertPCMToFloat32 = async ({\n bitDepth,\n buffer,\n skipWavHeader = false,\n}: {\n buffer: ArrayBuffer\n bitDepth: number\n skipWavHeader?: boolean\n}): Promise<{ pcmValues: Float32Array; min: number; max: number }> => {\n try {\n logger.debug(\n `Converting PCM to Float32: bitDepth: ${bitDepth}, buffer.byteLength: ${buffer.byteLength}`\n )\n const dataView = new DataView(buffer)\n let headerOffset = 0\n if (skipWavHeader) {\n const wavFileInfo: WavFileInfo = await getWavFileInfo(buffer)\n headerOffset = wavFileInfo.dataChunkOffset\n }\n\n const dataLength = buffer.byteLength - headerOffset\n const sampleLength = Math.floor(dataLength / (bitDepth / 8))\n const float32Array = new Float32Array(sampleLength)\n let min = Infinity\n let max = -Infinity\n\n for (let i = 0; i < sampleLength; i++) {\n const offset = headerOffset + i * (bitDepth / 8)\n const value = convertSample(dataView, offset, bitDepth)\n\n if (value < min) min = value\n if (value > max) 
max = value\n\n float32Array[i] = value\n }\n\n return { pcmValues: float32Array, min, max }\n } catch (error: unknown) {\n logger.error(`Error converting PCM to Float32`, error)\n return { pcmValues: new Float32Array(), min: 0, max: 0 }\n }\n}\n"]}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"encodingToBitDepth.d.ts","sourceRoot":"","sources":["../../src/utils/encodingToBitDepth.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,YAAY,EAAE,MAAM,0BAA0B,CAAA;AAEjE,eAAO,MAAM,kBAAkB,kBAE5B;IACC,QAAQ,EAAE,YAAY,CAAA;CACzB,KAAG,QAWH,CAAA"}
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
/**
 * Maps an encoding identifier to its bit depth.
 *
 * @param {object} options
 * @param {string} options.encoding - 'pcm_32bit', 'pcm_16bit' or 'pcm_8bit'.
 * @returns {number} 32, 16 or 8 respectively.
 * @throws {Error} For any other encoding value.
 */
export const encodingToBitDepth = ({ encoding }) => {
    if (encoding === 'pcm_32bit') {
        return 32;
    }
    if (encoding === 'pcm_16bit') {
        return 16;
    }
    if (encoding === 'pcm_8bit') {
        return 8;
    }
    throw new Error(`Unsupported encoding type: ${encoding}`);
};
|
|
13
|
+
//# sourceMappingURL=encodingToBitDepth.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"encodingToBitDepth.js","sourceRoot":"","sources":["../../src/utils/encodingToBitDepth.ts"],"names":[],"mappings":"AAEA,MAAM,CAAC,MAAM,kBAAkB,GAAG,CAAC,EAC/B,QAAQ,GAGX,EAAY,EAAE;IACX,QAAQ,QAAQ,EAAE,CAAC;QACf,KAAK,WAAW;YACZ,OAAO,EAAE,CAAA;QACb,KAAK,WAAW;YACZ,OAAO,EAAE,CAAA;QACb,KAAK,UAAU;YACX,OAAO,CAAC,CAAA;QACZ;YACI,MAAM,IAAI,KAAK,CAAC,8BAA8B,QAAQ,EAAE,CAAC,CAAA;IACjE,CAAC;AACL,CAAC,CAAA","sourcesContent":["import { BitDepth, EncodingType } from '../ExpoAudioStream.types'\n\nexport const encodingToBitDepth = ({\n encoding,\n}: {\n encoding: EncodingType\n}): BitDepth => {\n switch (encoding) {\n case 'pcm_32bit':\n return 32\n case 'pcm_16bit':\n return 16\n case 'pcm_8bit':\n return 8\n default:\n throw new Error(`Unsupported encoding type: ${encoding}`)\n }\n}\n"]}
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
import { BitDepth, SampleRate } from '../ExpoAudioStream.types';
|
|
2
|
+
/**
 * Metadata extracted from a WAV buffer by {@link getWavFileInfo}.
 */
export interface WavFileInfo {
    /** Samples per second, read from the "fmt " chunk. */
    sampleRate: SampleRate;
    /** Channel count, read from the "fmt " chunk. */
    numChannels: number;
    /** Bits per sample, read from the "fmt " chunk. */
    bitDepth: BitDepth;
    /** Total size of the inspected buffer, in bytes. */
    size: number;
    /** Duration in milliseconds, derived from the data chunk size. */
    durationMs: number;
    /** Human-readable description of the audio format tag. */
    audioFormatDescription: string;
    /** Average bytes per second. */
    byteRate: number;
    /** Number of bytes for one sample including all channels. */
    blockAlign: number;
    /** Optional creation date and time. */
    creationDateTime?: string;
    /** Optional comments or tags. */
    comments?: string;
    /** Optional compression type. */
    compressionType?: string;
    /** Byte offset at which the data chunk payload starts. */
    dataChunkOffset: number;
}
/**
 * Reads WAV metadata out of an in-memory buffer.
 *
 * @param arrayBuffer - Buffer holding the WAV data.
 * @returns Promise resolving to the parsed {@link WavFileInfo}.
 */
export declare const getWavFileInfo: (arrayBuffer: ArrayBuffer) => Promise<WavFileInfo>;
|
|
26
|
+
//# sourceMappingURL=getWavFileInfo.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"getWavFileInfo.d.ts","sourceRoot":"","sources":["../../src/utils/getWavFileInfo.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,QAAQ,EAAE,UAAU,EAAE,MAAM,0BAA0B,CAAA;AAoB/D;;GAEG;AACH,MAAM,WAAW,WAAW;IACxB,UAAU,EAAE,UAAU,CAAA;IACtB,WAAW,EAAE,MAAM,CAAA;IACnB,QAAQ,EAAE,QAAQ,CAAA;IAClB,IAAI,EAAE,MAAM,CAAA;IACZ,UAAU,EAAE,MAAM,CAAA;IAClB,sBAAsB,EAAE,MAAM,CAAA;IAC9B,QAAQ,EAAE,MAAM,CAAA;IAChB,UAAU,EAAE,MAAM,CAAA;IAClB,gBAAgB,CAAC,EAAE,MAAM,CAAA;IACzB,QAAQ,CAAC,EAAE,MAAM,CAAA;IACjB,eAAe,CAAC,EAAE,MAAM,CAAA;IACxB,eAAe,EAAE,MAAM,CAAA;CAC1B;AAED;;;;;GAKG;AACH,eAAO,MAAM,cAAc,gBACV,WAAW,KACzB,OAAO,CAAC,WAAW,CAmFrB,CAAA"}
|
|
@@ -0,0 +1,92 @@
|
|
|
1
|
+
// packages/expo-audio-stream/src/utils/getWavFileInfo.ts
|
|
2
|
+
import { DATA_CHUNK_ID, DEFAULT_BIT_DEPTH, DEFAULT_SAMPLE_RATE, FMT_CHUNK_ID, INFO_CHUNK_ID, RIFF_HEADER, WAVE_HEADER, } from '../constants';
|
|
3
|
+
// Audio format descriptions
|
|
4
|
+
// Lookup from the numeric format tag stored in a "fmt " chunk to a readable
// label. Keys are written in hex, as format tags usually are; each evaluates
// to the same property name as its decimal form.
const AUDIO_FORMATS = {
    0x0001: 'PCM',
    0x0003: 'IEEE float',
    0x0006: '8-bit ITU-T G.711 A-law',
    0x0007: '8-bit ITU-T G.711 µ-law',
    0xfffe: 'WAVE_FORMAT_EXTENSIBLE',
};
|
|
11
|
+
/**
 * Extracts metadata from a WAV buffer.
 *
 * Walks the RIFF chunk list starting at byte 12, reading the "fmt " chunk for
 * the format fields and stopping at the first "data" chunk.
 *
 * @param arrayBuffer - The array buffer containing the WAV data.
 * @returns A promise that resolves to the extracted metadata.
 * @throws {Error} 'Invalid WAV file' when the RIFF/WAVE signature is missing
 *   or the buffer is too short to contain it.
 * @throws {Error} 'Unsupported WAV file format' for an unknown format tag.
 * @throws {Error} 'Incomplete WAV file information' when no usable "fmt " or
 *   "data" chunk was found.
 */
export const getWavFileInfo = async (arrayBuffer) => {
    const view = new DataView(arrayBuffer);
    // The signature check below reads bytes 0-11; report a short buffer as an
    // invalid file instead of letting DataView throw a RangeError.
    if (view.byteLength < 12) {
        throw new Error('Invalid WAV file');
    }
    // Check if the file is a valid RIFF/WAVE file
    const riffHeader = view.getUint32(0, false);
    const waveHeader = view.getUint32(8, false);
    if (riffHeader !== RIFF_HEADER || waveHeader !== WAVE_HEADER) {
        throw new Error('Invalid WAV file');
    }
    // Initialize variables for the metadata
    let chunkOffset = 12;
    let sampleRate = DEFAULT_SAMPLE_RATE;
    let numChannels = 0;
    let bitDepth = DEFAULT_BIT_DEPTH;
    let dataChunkSize = 0;
    let audioFormat = 0;
    let byteRate = 0;
    let blockAlign = 0;
    let creationDateTime = '';
    let comments = '';
    let dataChunkOffset = 0;
    // Parse chunks to find the "fmt " and "data" chunks. Only enter the loop
    // while a full 8-byte chunk header (id + size) is still available.
    while (chunkOffset + 8 <= view.byteLength) {
        const chunkId = view.getUint32(chunkOffset, false);
        const chunkSize = view.getUint32(chunkOffset + 4, true);
        if (chunkId === FMT_CHUNK_ID) {
            // "fmt "
            audioFormat = view.getUint16(chunkOffset + 8, true);
            if (!AUDIO_FORMATS[audioFormat]) {
                throw new Error('Unsupported WAV file format');
            }
            numChannels = view.getUint16(chunkOffset + 10, true);
            sampleRate = view.getUint32(chunkOffset + 12, true);
            byteRate = view.getUint32(chunkOffset + 16, true);
            blockAlign = view.getUint16(chunkOffset + 20, true);
            bitDepth = view.getUint16(chunkOffset + 22, true);
        }
        else if (chunkId === DATA_CHUNK_ID) {
            // "data"
            dataChunkSize = chunkSize;
            dataChunkOffset = chunkOffset + 8; // Position after chunk header
            break;
        }
        else if (chunkId === INFO_CHUNK_ID) {
            // "INFO"
            // Read INFO chunk (assuming it contains a text-based creation date/time and comments)
            const infoStart = chunkOffset + 8;
            const infoText = new TextDecoder().decode(new Uint8Array(arrayBuffer.slice(infoStart, infoStart + chunkSize)));
            const infoParts = infoText.split('\0');
            creationDateTime = infoParts[0];
            comments = infoParts[1];
        }
        // RIFF chunks are word-aligned: an odd-sized payload is followed by one
        // pad byte that is not counted in chunkSize.
        chunkOffset += 8 + chunkSize + (chunkSize % 2);
    }
    if (!sampleRate || !numChannels || !bitDepth || !dataChunkSize) {
        throw new Error('Incomplete WAV file information');
    }
    // Calculate duration
    const bytesPerSample = bitDepth / 8;
    const numSamples = dataChunkSize / (numChannels * bytesPerSample);
    const durationMs = (numSamples / sampleRate) * 1000;
    return {
        sampleRate,
        numChannels,
        bitDepth,
        size: arrayBuffer.byteLength,
        durationMs,
        audioFormatDescription: AUDIO_FORMATS[audioFormat],
        byteRate,
        blockAlign,
        creationDateTime: creationDateTime || undefined,
        comments: comments || undefined,
        compressionType: audioFormat === 1 ? 'None' : AUDIO_FORMATS[audioFormat],
        dataChunkOffset,
    };
};
|
|
92
|
+
//# sourceMappingURL=getWavFileInfo.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"getWavFileInfo.js","sourceRoot":"","sources":["../../src/utils/getWavFileInfo.ts"],"names":[],"mappings":"AAAA,yDAAyD;AAGzD,OAAO,EACH,aAAa,EACb,iBAAiB,EACjB,mBAAmB,EACnB,YAAY,EACZ,aAAa,EACb,WAAW,EACX,WAAW,GACd,MAAM,cAAc,CAAA;AAErB,4BAA4B;AAC5B,MAAM,aAAa,GAA8B;IAC7C,CAAC,EAAE,KAAK;IACR,CAAC,EAAE,YAAY;IACf,CAAC,EAAE,yBAAyB;IAC5B,CAAC,EAAE,yBAAyB;IAC5B,KAAK,EAAE,wBAAwB;CAClC,CAAA;AAoBD;;;;;GAKG;AACH,MAAM,CAAC,MAAM,cAAc,GAAG,KAAK,EAC/B,WAAwB,EACJ,EAAE;IACtB,MAAM,IAAI,GAAG,IAAI,QAAQ,CAAC,WAAW,CAAC,CAAA;IAEtC,8CAA8C;IAC9C,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,CAAA;IAC3C,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,CAAA;IAC3C,IAAI,UAAU,KAAK,WAAW,IAAI,UAAU,KAAK,WAAW,EAAE,CAAC;QAC3D,MAAM,IAAI,KAAK,CAAC,kBAAkB,CAAC,CAAA;IACvC,CAAC;IAED,wCAAwC;IACxC,IAAI,cAAc,GAAG,EAAE,CAAA;IACvB,IAAI,UAAU,GAAe,mBAAmB,CAAA;IAChD,IAAI,WAAW,GAAG,CAAC,CAAA;IACnB,IAAI,QAAQ,GAAa,iBAAiB,CAAA;IAC1C,IAAI,aAAa,GAAG,CAAC,CAAA;IACrB,IAAI,WAAW,GAAG,CAAC,CAAA;IACnB,IAAI,QAAQ,GAAG,CAAC,CAAA;IAChB,IAAI,UAAU,GAAG,CAAC,CAAA;IAClB,IAAI,gBAAgB,GAAG,EAAE,CAAA;IACzB,IAAI,QAAQ,GAAG,EAAE,CAAA;IACjB,IAAI,eAAe,GAAG,CAAC,CAAA;IAEvB,oDAAoD;IACpD,OAAO,cAAc,GAAG,IAAI,CAAC,UAAU,EAAE,CAAC;QACtC,MAAM,OAAO,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,EAAE,KAAK,CAAC,CAAA;QACrD,MAAM,SAAS,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,CAAC,EAAE,IAAI,CAAC,CAAA;QAC1D,IAAI,OAAO,KAAK,YAAY,EAAE,CAAC;YAC3B,SAAS;YACT,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,CAAC,EAAE,IAAI,CAAC,CAAA;YACtD,IAAI,CAAC,aAAa,CAAC,WAAW,CAAC,EAAE,CAAC;gBAC9B,MAAM,IAAI,KAAK,CAAC,6BAA6B,CAAC,CAAA;YAClD,CAAC;YACD,WAAW,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACvD,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAe,CAAA;YACpE,QAAQ,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACpD,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAC,CAAA;YACtD,QAAQ,GAAG,IAAI,CAAC,SAAS,CAAC,cAAc,GAAG,EAAE,EAAE,IAAI,CAAa,CAAA;QACpE,CAAC;aAAM,IAAI,OAAO,KAAK,aAAa,EAAE,CAAC;YACnC,SAAS;YACT,aAAa,GAAG,SAAS,CAAA;YACzB,e
AAe,GAAG,cAAc,GAAG,CAAC,CAAA,CAAC,8BAA8B;YACnE,MAAK;QACT,CAAC;aAAM,IAAI,OAAO,KAAK,aAAa,EAAE,CAAC;YACnC,SAAS;YACT,sFAAsF;YACtF,MAAM,SAAS,GAAG,cAAc,GAAG,CAAC,CAAA;YACpC,MAAM,QAAQ,GAAG,IAAI,WAAW,EAAE,CAAC,MAAM,CACrC,IAAI,UAAU,CACV,WAAW,CAAC,KAAK,CAAC,SAAS,EAAE,SAAS,GAAG,SAAS,CAAC,CACtD,CACJ,CAAA;YACD,MAAM,SAAS,GAAG,QAAQ,CAAC,KAAK,CAAC,IAAI,CAAC,CAAA;YACtC,gBAAgB,GAAG,SAAS,CAAC,CAAC,CAAC,CAAA;YAC/B,QAAQ,GAAG,SAAS,CAAC,CAAC,CAAC,CAAA;QAC3B,CAAC;QACD,cAAc,IAAI,CAAC,GAAG,SAAS,CAAA;IACnC,CAAC;IAED,IAAI,CAAC,UAAU,IAAI,CAAC,WAAW,IAAI,CAAC,QAAQ,IAAI,CAAC,aAAa,EAAE,CAAC;QAC7D,MAAM,IAAI,KAAK,CAAC,iCAAiC,CAAC,CAAA;IACtD,CAAC;IAED,qBAAqB;IACrB,MAAM,cAAc,GAAG,QAAQ,GAAG,CAAC,CAAA;IACnC,MAAM,UAAU,GAAG,aAAa,GAAG,CAAC,WAAW,GAAG,cAAc,CAAC,CAAA;IACjE,MAAM,UAAU,GAAG,CAAC,UAAU,GAAG,UAAU,CAAC,GAAG,IAAI,CAAA;IAEnD,OAAO;QACH,UAAU;QACV,WAAW;QACX,QAAQ;QACR,IAAI,EAAE,WAAW,CAAC,UAAU;QAC5B,UAAU;QACV,sBAAsB,EAAE,aAAa,CAAC,WAAW,CAAC;QAClD,QAAQ;QACR,UAAU;QACV,gBAAgB,EAAE,gBAAgB,IAAI,SAAS;QAC/C,QAAQ,EAAE,QAAQ,IAAI,SAAS;QAC/B,eAAe,EACX,WAAW,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,aAAa,CAAC,WAAW,CAAC;QAC3D,eAAe;KAClB,CAAA;AACL,CAAC,CAAA","sourcesContent":["// packages/expo-audio-stream/src/utils/getWavFileInfo.ts\n\nimport { BitDepth, SampleRate } from '../ExpoAudioStream.types'\nimport {\n DATA_CHUNK_ID,\n DEFAULT_BIT_DEPTH,\n DEFAULT_SAMPLE_RATE,\n FMT_CHUNK_ID,\n INFO_CHUNK_ID,\n RIFF_HEADER,\n WAVE_HEADER,\n} from '../constants'\n\n// Audio format descriptions\nconst AUDIO_FORMATS: { [key: number]: string } = {\n 1: 'PCM',\n 3: 'IEEE float',\n 6: '8-bit ITU-T G.711 A-law',\n 7: '8-bit ITU-T G.711 µ-law',\n 65534: 'WAVE_FORMAT_EXTENSIBLE',\n}\n\n/**\n * Interface representing the metadata of a WAV file.\n */\nexport interface WavFileInfo {\n sampleRate: SampleRate\n numChannels: number\n bitDepth: BitDepth\n size: number // in bytes\n durationMs: number // in ms\n audioFormatDescription: string // Description of the audio format\n byteRate: number // Average bytes per second\n blockAlign: 
number // Number of bytes for one sample including all channels\n creationDateTime?: string // Optional creation date and time\n comments?: string // Optional comments or tags\n compressionType?: string // Optional compression type\n dataChunkOffset: number // Position of the first data chunk\n}\n\n/**\n * Extracts metadata from a WAV buffer.\n *\n * @param arrayBuffer - The array buffer containing the WAV data.\n * @returns A promise that resolves to the extracted metadata.\n */\nexport const getWavFileInfo = async (\n arrayBuffer: ArrayBuffer\n): Promise<WavFileInfo> => {\n const view = new DataView(arrayBuffer)\n\n // Check if the file is a valid RIFF/WAVE file\n const riffHeader = view.getUint32(0, false)\n const waveHeader = view.getUint32(8, false)\n if (riffHeader !== RIFF_HEADER || waveHeader !== WAVE_HEADER) {\n throw new Error('Invalid WAV file')\n }\n\n // Initialize variables for the metadata\n let fmtChunkOffset = 12\n let sampleRate: SampleRate = DEFAULT_SAMPLE_RATE\n let numChannels = 0\n let bitDepth: BitDepth = DEFAULT_BIT_DEPTH\n let dataChunkSize = 0\n let audioFormat = 0\n let byteRate = 0\n let blockAlign = 0\n let creationDateTime = ''\n let comments = ''\n let dataChunkOffset = 0\n\n // Parse chunks to find the \"fmt \" and \"data\" chunks\n while (fmtChunkOffset < view.byteLength) {\n const chunkId = view.getUint32(fmtChunkOffset, false)\n const chunkSize = view.getUint32(fmtChunkOffset + 4, true)\n if (chunkId === FMT_CHUNK_ID) {\n // \"fmt \"\n audioFormat = view.getUint16(fmtChunkOffset + 8, true)\n if (!AUDIO_FORMATS[audioFormat]) {\n throw new Error('Unsupported WAV file format')\n }\n numChannels = view.getUint16(fmtChunkOffset + 10, true)\n sampleRate = view.getUint32(fmtChunkOffset + 12, true) as SampleRate\n byteRate = view.getUint32(fmtChunkOffset + 16, true)\n blockAlign = view.getUint16(fmtChunkOffset + 20, true)\n bitDepth = view.getUint16(fmtChunkOffset + 22, true) as BitDepth\n } else if (chunkId === DATA_CHUNK_ID) {\n // 
\"data\"\n dataChunkSize = chunkSize\n dataChunkOffset = fmtChunkOffset + 8 // Position after chunk header\n break\n } else if (chunkId === INFO_CHUNK_ID) {\n // \"INFO\"\n // Read INFO chunk (assuming it contains a text-based creation date/time and comments)\n const infoStart = fmtChunkOffset + 8\n const infoText = new TextDecoder().decode(\n new Uint8Array(\n arrayBuffer.slice(infoStart, infoStart + chunkSize)\n )\n )\n const infoParts = infoText.split('\\0')\n creationDateTime = infoParts[0]\n comments = infoParts[1]\n }\n fmtChunkOffset += 8 + chunkSize\n }\n\n if (!sampleRate || !numChannels || !bitDepth || !dataChunkSize) {\n throw new Error('Incomplete WAV file information')\n }\n\n // Calculate duration\n const bytesPerSample = bitDepth / 8\n const numSamples = dataChunkSize / (numChannels * bytesPerSample)\n const durationMs = (numSamples / sampleRate) * 1000\n\n return {\n sampleRate,\n numChannels,\n bitDepth,\n size: arrayBuffer.byteLength,\n durationMs,\n audioFormatDescription: AUDIO_FORMATS[audioFormat],\n byteRate,\n blockAlign,\n creationDateTime: creationDateTime || undefined,\n comments: comments || undefined,\n compressionType:\n audioFormat === 1 ? 'None' : AUDIO_FORMATS[audioFormat],\n dataChunkOffset,\n }\n}\n"]}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
/** Arguments accepted by {@link writeWavHeader}. */
interface WavHeaderOptions {
    /** Buffer the header is written into, starting at byte 0; the same buffer is returned. */
    buffer: ArrayBuffer;
    /** Samples per second, stored in the header's SampleRate field. */
    sampleRate: number;
    /** Channel count, used to derive BlockAlign and ByteRate. */
    numChannels: number;
    /** Bits per sample; 32 makes a freshly written header use format tag 3 (float) instead of 1 (PCM). */
    bitDepth: number;
}
/**
 * Writes a WAV header at the start of `buffer`, or updates selected fields
 * when the buffer already begins with "RIFF".
 *
 * @returns The `buffer` that was passed in.
 */
export declare const writeWavHeader: ({ buffer, sampleRate, numChannels, bitDepth, }: WavHeaderOptions) => ArrayBuffer;
|
|
8
|
+
export {};
|
|
9
|
+
//# sourceMappingURL=writeWavHeader.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"writeWavHeader.d.ts","sourceRoot":"","sources":["../../src/utils/writeWavHeader.ts"],"names":[],"mappings":"AACA,UAAU,gBAAgB;IACtB,MAAM,EAAE,WAAW,CAAA;IACnB,UAAU,EAAE,MAAM,CAAA;IAClB,WAAW,EAAE,MAAM,CAAA;IACnB,QAAQ,EAAE,MAAM,CAAA;CACnB;AAED,eAAO,MAAM,cAAc,mDAKxB,gBAAgB,KAAG,WA0CrB,CAAA"}
|
|
@@ -0,0 +1,41 @@
|
|
|
1
|
+
/**
 * Writes, or refreshes, a canonical 44-byte WAV header in place at the start
 * of `buffer`.
 *
 * The header occupies bytes 0-43 of `buffer` itself, so the audio payload is
 * everything after it; the RIFF and data sizes are derived from that.
 *
 * @param {object} options
 * @param {ArrayBuffer} options.buffer - Buffer to write into; mutated in place.
 * @param {number} options.sampleRate - Samples per second.
 * @param {number} options.numChannels - Number of interleaved channels.
 * @param {number} options.bitDepth - Bits per sample; 32 is tagged as IEEE
 *   float (format 3) when a new header is written, anything else as PCM (1).
 * @returns {ArrayBuffer} The same `buffer` instance.
 * @throws {RangeError} When `buffer` is too small to hold the header.
 */
export const writeWavHeader = ({ buffer, sampleRate, numChannels, bitDepth, }) => {
    const HEADER_SIZE = 44;
    if (buffer.byteLength < HEADER_SIZE) {
        throw new RangeError(`Buffer of ${buffer.byteLength} bytes is too small for a ${HEADER_SIZE}-byte WAV header`);
    }
    const bytesPerSample = bitDepth / 8;
    const blockAlign = numChannels * bytesPerSample;
    const byteRate = sampleRate * blockAlign;
    // The header lives inside the buffer, so it must not be counted as audio.
    const dataSize = buffer.byteLength - HEADER_SIZE;
    const view = new DataView(buffer);
    // Writes an ASCII tag byte by byte at the given offset.
    const writeString = (offset, text) => {
        for (let i = 0; i < text.length; i++) {
            view.setUint8(offset + i, text.charCodeAt(i));
        }
    };
    // Check if the buffer already has a WAV header by looking for "RIFF" at the start
    const existingHeader = view.getUint32(0, false) === 0x52494646; // "RIFF" in ASCII
    if (!existingHeader) {
        // Write the WAV header
        writeString(0, 'RIFF'); // ChunkID
        view.setUint32(4, 36 + dataSize, true); // ChunkSize (file size - 8)
        writeString(8, 'WAVE'); // Format
        writeString(12, 'fmt '); // Subchunk1ID
        view.setUint32(16, 16, true); // Subchunk1Size (16 for PCM)
        view.setUint16(20, bitDepth === 32 ? 3 : 1, true); // AudioFormat (3 for float, 1 for PCM)
        view.setUint16(22, numChannels, true); // NumChannels
        view.setUint32(24, sampleRate, true); // SampleRate
        view.setUint32(28, byteRate, true); // ByteRate
        view.setUint16(32, blockAlign, true); // BlockAlign
        view.setUint16(34, bitDepth, true); // BitsPerSample
        writeString(36, 'data'); // Subchunk2ID
        view.setUint32(40, dataSize, true); // Subchunk2Size
    }
    else {
        // Update the existing WAV header. NumChannels and BitsPerSample are
        // rewritten too, because BlockAlign and ByteRate are derived from them
        // and the header would otherwise contradict itself.
        view.setUint32(4, 36 + dataSize, true); // Update ChunkSize
        view.setUint16(22, numChannels, true); // Update NumChannels
        view.setUint32(24, sampleRate, true); // Update SampleRate
        view.setUint32(28, byteRate, true); // Update ByteRate
        view.setUint16(32, blockAlign, true); // Update BlockAlign
        view.setUint16(34, bitDepth, true); // Update BitsPerSample
        view.setUint32(40, dataSize, true); // Update Subchunk2Size
    }
    return buffer;
};
|
|
41
|
+
//# sourceMappingURL=writeWavHeader.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"writeWavHeader.js","sourceRoot":"","sources":["../../src/utils/writeWavHeader.ts"],"names":[],"mappings":"AAQA,MAAM,CAAC,MAAM,cAAc,GAAG,CAAC,EAC3B,MAAM,EACN,UAAU,EACV,WAAW,EACX,QAAQ,GACO,EAAe,EAAE;IAChC,MAAM,cAAc,GAAG,QAAQ,GAAG,CAAC,CAAA;IACnC,MAAM,UAAU,GAAG,MAAM,CAAC,UAAU,GAAG,CAAC,WAAW,GAAG,cAAc,CAAC,CAAA;IACrE,MAAM,IAAI,GAAG,IAAI,QAAQ,CAAC,MAAM,CAAC,CAAA;IACjC,MAAM,UAAU,GAAG,WAAW,GAAG,cAAc,CAAA;IAC/C,MAAM,QAAQ,GAAG,UAAU,GAAG,UAAU,CAAA;IAExC,6CAA6C;IAC7C,MAAM,WAAW,GAAG,CAAC,IAAc,EAAE,MAAc,EAAE,MAAc,EAAE,EAAE;QACnE,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACrC,IAAI,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,MAAM,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC,CAAA;QACnD,CAAC;IACL,CAAC,CAAA;IAED,kFAAkF;IAClF,MAAM,cAAc,GAAG,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,KAAK,CAAC,KAAK,UAAU,CAAA,CAAC,kBAAkB;IAEjF,IAAI,CAAC,cAAc,EAAE,CAAC;QAClB,uBAAuB;QACvB,WAAW,CAAC,IAAI,EAAE,CAAC,EAAE,MAAM,CAAC,CAAA,CAAC,UAAU;QACvC,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,GAAG,UAAU,GAAG,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,YAAY;QAClE,WAAW,CAAC,IAAI,EAAE,CAAC,EAAE,MAAM,CAAC,CAAA,CAAC,SAAS;QACtC,WAAW,CAAC,IAAI,EAAE,EAAE,EAAE,MAAM,CAAC,CAAA,CAAC,cAAc;QAC5C,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,EAAE,EAAE,IAAI,CAAC,CAAA,CAAC,6BAA6B;QAC1D,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,KAAK,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE,IAAI,CAAC,CAAA,CAAC,uCAAuC;QACzF,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,WAAW,EAAE,IAAI,CAAC,CAAA,CAAC,cAAc;QACpD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,aAAa;QAClD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,WAAW;QAC9C,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,aAAa;QAClD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,gBAAgB;QACnD,WAAW,CAAC,IAAI,EAAE,EAAE,EAAE,MAAM,CAAC,CAAA,CAAC,cAAc;QAC5C,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,GAAG,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,gBAAgB;IACtE,CAAC;SAAM,CAAC;QACJ,8CAA8C;QAC9C,IAAI,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,GAAG,UAAU,GAAG,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,mBAAmB;QACzE,IAAI,CAAC,SAAS,CAA
C,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,oBAAoB;QACzD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,QAAQ,EAAE,IAAI,CAAC,CAAA,CAAC,kBAAkB;QACrD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,oBAAoB;QACzD,IAAI,CAAC,SAAS,CAAC,EAAE,EAAE,UAAU,GAAG,UAAU,EAAE,IAAI,CAAC,CAAA,CAAC,uBAAuB;IAC7E,CAAC;IAED,OAAO,MAAM,CAAA;AACjB,CAAC,CAAA","sourcesContent":["// packages/expo-audio-stream/src/utils/writeWavHeader.ts\ninterface WavHeaderOptions {\n buffer: ArrayBuffer\n sampleRate: number\n numChannels: number\n bitDepth: number\n}\n\nexport const writeWavHeader = ({\n buffer,\n sampleRate,\n numChannels,\n bitDepth,\n}: WavHeaderOptions): ArrayBuffer => {\n const bytesPerSample = bitDepth / 8\n const numSamples = buffer.byteLength / (numChannels * bytesPerSample)\n const view = new DataView(buffer)\n const blockAlign = numChannels * bytesPerSample\n const byteRate = sampleRate * blockAlign\n\n // Function to write a string to the DataView\n const writeString = (view: DataView, offset: number, string: string) => {\n for (let i = 0; i < string.length; i++) {\n view.setUint8(offset + i, string.charCodeAt(i))\n }\n }\n\n // Check if the buffer already has a WAV header by looking for \"RIFF\" at the start\n const existingHeader = view.getUint32(0, false) === 0x52494646 // \"RIFF\" in ASCII\n\n if (!existingHeader) {\n // Write the WAV header\n writeString(view, 0, 'RIFF') // ChunkID\n view.setUint32(4, 36 + numSamples * blockAlign, true) // ChunkSize\n writeString(view, 8, 'WAVE') // Format\n writeString(view, 12, 'fmt ') // Subchunk1ID\n view.setUint32(16, 16, true) // Subchunk1Size (16 for PCM)\n view.setUint16(20, bitDepth === 32 ? 
3 : 1, true) // AudioFormat (3 for float, 1 for PCM)\n view.setUint16(22, numChannels, true) // NumChannels\n view.setUint32(24, sampleRate, true) // SampleRate\n view.setUint32(28, byteRate, true) // ByteRate\n view.setUint16(32, blockAlign, true) // BlockAlign\n view.setUint16(34, bitDepth, true) // BitsPerSample\n writeString(view, 36, 'data') // Subchunk2ID\n view.setUint32(40, numSamples * blockAlign, true) // Subchunk2Size\n } else {\n // Update the existing WAV header if necessary\n view.setUint32(4, 36 + numSamples * blockAlign, true) // Update ChunkSize\n view.setUint32(24, sampleRate, true) // Update SampleRate\n view.setUint32(28, byteRate, true) // Update ByteRate\n view.setUint16(32, blockAlign, true) // Update BlockAlign\n view.setUint32(40, numSamples * blockAlign, true) // Update Subchunk2Size\n }\n\n return buffer\n}\n"]}
|
|
@@ -0,0 +1,2 @@
|
|
|
1
|
+
export declare const InlineFeaturesExtractor = "\n\n// Unique ID counter\nlet uniqueIdCounter = 0;\n\nself.onmessage = function (event) {\n const {\n channelData, // this is only the newly recorded data when live recording.\n sampleRate,\n pointsPerSecond,\n algorithm,\n bitDepth,\n fullAudioDurationMs,\n numberOfChannels,\n features: _features,\n } = event.data;\n\n console.log(\"[AudioFeaturesExtractor] Worker received message\", event.data);\n const features = _features || {};\n\n const SILENCE_THRESHOLD = 0.01;\n const MIN_SILENCE_DURATION = 1.5 * sampleRate; // 1.5 seconds of silence\n const SPEECH_INERTIA_DURATION = 0.1 * sampleRate; // Speech inertia duration in samples\n const RMS_THRESHOLD = 0.01;\n const ZCR_THRESHOLD = 0.1;\n\n // Placeholder functions for feature extraction\n const extractMFCC = (segmentData, sampleRate) => {\n // Implement MFCC extraction logic here\n return [];\n };\n\n const extractSpectralCentroid = (segmentData, sampleRate) => {\n const magnitudeSpectrum = segmentData.map((v) => v * v);\n const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0);\n if (sum === 0) return 0;\n\n const weightedSum = magnitudeSpectrum.reduce(\n (acc, value, index) => acc + index * value,\n 0,\n );\n return ((weightedSum / sum) * (sampleRate / 2)) / magnitudeSpectrum.length;\n };\n\n const extractSpectralFlatness = (segmentData) => {\n const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));\n const geometricMean = Math.exp(\n magnitudeSpectrum\n .map((v) => Math.log(v + Number.MIN_VALUE))\n .reduce((a, b) => a + b) / magnitudeSpectrum.length,\n );\n const arithmeticMean =\n magnitudeSpectrum.reduce((a, b) => a + b) / magnitudeSpectrum.length;\n return arithmeticMean === 0 ? 
0 : geometricMean / arithmeticMean;\n };\n\n const extractSpectralRollOff = (segmentData, sampleRate) => {\n const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));\n const totalEnergy = magnitudeSpectrum.reduce((a, b) => a + b, 0);\n const rollOffThreshold = totalEnergy * 0.85;\n let cumulativeEnergy = 0;\n\n for (let i = 0; i < magnitudeSpectrum.length; i++) {\n cumulativeEnergy += magnitudeSpectrum[i];\n if (cumulativeEnergy >= rollOffThreshold) {\n return (i / magnitudeSpectrum.length) * (sampleRate / 2);\n }\n }\n\n return 0;\n };\n\n const extractSpectralBandwidth = (segmentData, sampleRate) => {\n const centroid = extractSpectralCentroid(segmentData, sampleRate);\n const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));\n const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0);\n if (sum === 0) return 0;\n\n const weightedSum = magnitudeSpectrum.reduce(\n (acc, value, index) => acc + value * Math.pow(index - centroid, 2),\n 0,\n );\n return Math.sqrt(weightedSum / sum);\n };\n\n const extractChromagram = (segmentData, sampleRate) => {\n return []; // TODO implement\n };\n\n const extractHNR = (segmentData) => {\n const frameSize = segmentData.length;\n const autocorrelation = new Float32Array(frameSize);\n\n // Compute the autocorrelation of the segment data\n for (let i = 0; i < frameSize; i++) {\n let sum = 0;\n for (let j = 0; j < frameSize - i; j++) {\n sum += segmentData[j] * segmentData[j + i];\n }\n autocorrelation[i] = sum;\n }\n\n // Find the maximum autocorrelation value (excluding the zero lag)\n const maxAutocorrelation = Math.max(...autocorrelation.subarray(1));\n\n // Compute the HNR\n return autocorrelation[0] !== 0\n ? 
10 *\n Math.log10(\n maxAutocorrelation / (autocorrelation[0] - maxAutocorrelation),\n )\n : 0;\n };\n\n const extractWaveform = (\n channelData, // Float32Array\n sampleRate, // number\n pointsPerSecond, // number\n algorithm, // string\n ) => {\n const totalSamples = channelData.length;\n const segmentDuration = totalSamples / sampleRate;\n const totalPoints = Math.max(\n Math.ceil(segmentDuration * pointsPerSecond),\n 1,\n );\n const pointInterval = Math.ceil(totalSamples / totalPoints);\n const dataPoints = [];\n let minAmplitude = Infinity;\n let maxAmplitude = -Infinity;\n let silenceStart = null;\n let lastSpeechEnd = -Infinity;\n let isSpeech = false;\n\n const expectedPoints = segmentDuration * pointsPerSecond;\n const samplesPerPoint = Math.ceil(channelData.length / expectedPoints);\n\n for (let i = 0; i < expectedPoints; i++) {\n const start = i * samplesPerPoint;\n const end = Math.min(start + samplesPerPoint, totalSamples);\n\n let sumSquares = 0;\n let zeroCrossings = 0;\n let prevValue = channelData[start];\n let localMinAmplitude = Infinity;\n let localMaxAmplitude = -Infinity;\n let hasNonZeroValue = false;\n\n // compute values for the segment\n for (let j = start; j < end; j++) {\n const value = channelData[j];\n sumSquares += value * value;\n if (j > start && value * prevValue < 0) {\n zeroCrossings++;\n }\n prevValue = value;\n\n const absValue = Math.abs(value);\n localMinAmplitude = Math.min(localMinAmplitude, absValue);\n localMaxAmplitude = Math.max(localMaxAmplitude, absValue);\n\n if (absValue !== 0) {\n hasNonZeroValue = true;\n }\n }\n\n // Post-processing checks\n if (!hasNonZeroValue) {\n // All values are zero\n localMinAmplitude = 0;\n localMaxAmplitude = 0;\n }\n\n const rms = Math.sqrt(sumSquares / (end - start));\n minAmplitude = Math.min(minAmplitude, rms);\n maxAmplitude = Math.max(maxAmplitude, rms);\n\n const energy = sumSquares;\n const zcr = zeroCrossings / (end - start);\n\n const silent = rms < SILENCE_THRESHOLD;\n const 
dB = 20 * Math.log10(rms);\n\n if (silent) {\n if (silenceStart === null) {\n silenceStart = start;\n } else if (start - silenceStart > MIN_SILENCE_DURATION) {\n // Silence detected for longer than the threshold, set amplitude to 0\n localMaxAmplitude = 0;\n localMinAmplitude = 0;\n isSpeech = false;\n }\n } else {\n silenceStart = null;\n if (!isSpeech && start - lastSpeechEnd < SPEECH_INERTIA_DURATION) {\n isSpeech = true;\n }\n lastSpeechEnd = end;\n }\n\n const activeSpeech =\n (rms > RMS_THRESHOLD && zcr > ZCR_THRESHOLD) ||\n (isSpeech && start - lastSpeechEnd < SPEECH_INERTIA_DURATION);\n\n if (activeSpeech) {\n isSpeech = true;\n lastSpeechEnd = end;\n } else {\n isSpeech = false;\n }\n\n const bytesPerSample = bitDepth / 8;\n const startPosition = start * bytesPerSample * numberOfChannels; // Calculate start position in bytes\n const endPosition = end * bytesPerSample * numberOfChannels; // Calculate end position in bytes\n\n // Compute features\n const segmentData = channelData.slice(start, end);\n const mfcc = features.mfcc ? extractMFCC(segmentData, sampleRate) : [];\n const spectralCentroid = features.spectralCentroid\n ? extractSpectralCentroid(segmentData, sampleRate)\n : 0;\n const spectralFlatness = features.spectralFlatness\n ? extractSpectralFlatness(segmentData)\n : 0;\n const spectralRollOff = features.spectralRollOff\n ? extractSpectralRollOff(segmentData, sampleRate)\n : 0;\n const spectralBandwidth = features.spectralBandwidth\n ? extractSpectralBandwidth(segmentData, sampleRate)\n : 0;\n const chromagram = features.chromagram\n ? extractChromagram(segmentData, sampleRate)\n : [];\n const hnr = features.hnr ? extractHNR(segmentData) : 0;\n\n const newData = {\n id: uniqueIdCounter++, // Assign unique ID and increment the counter\n amplitude: algorithm === \"peak\" ? 
localMaxAmplitude : rms,\n activeSpeech,\n dB,\n silent,\n features: {\n energy,\n rms,\n minAmplitude: localMinAmplitude,\n maxAmplitude: localMaxAmplitude,\n zcr,\n mfcc: [], // Placeholder for MFCC features\n spectralCentroid, // Computed spectral centroid\n spectralFlatness, // Computed spectral flatness\n spectralRollOff, // Computed spectral roll-off\n spectralBandwidth, // Computed spectral bandwidth\n chromagram, // Computed chromagram\n hnr, // Computed HNR\n },\n startTime: start / sampleRate,\n endTime: end / sampleRate,\n startPosition,\n endPosition,\n samples: end - start,\n speaker: 0, // Assuming speaker detection is to be handled later\n };\n\n dataPoints.push(newData);\n }\n\n return {\n pointsPerSecond,\n durationMs: fullAudioDurationMs,\n bitDepth,\n samples: totalSamples,\n numberOfChannels,\n sampleRate,\n dataPoints,\n amplitudeRange: {\n min: minAmplitude,\n max: maxAmplitude,\n },\n speakerChanges: [], // Placeholder for future speaker detection logic\n };\n };\n\n try {\n const result = extractWaveform(\n channelData,\n sampleRate,\n pointsPerSecond,\n algorithm,\n );\n self.postMessage({\n command: \"features\",\n result,\n });\n } catch (error) {\n console.error(\"[AudioFeaturesExtractor] Error in processing\", error);\n self.postMessage({ error: error.message });\n } finally {\n // Do not close the worker so it can be re-used for subsequent messages\n // self.close();\n }\n};\n";
|
|
2
|
+
//# sourceMappingURL=InlineFeaturesExtractor.web.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"InlineFeaturesExtractor.web.d.ts","sourceRoot":"","sources":["../../src/workers/InlineFeaturesExtractor.web.tsx"],"names":[],"mappings":"AAAA,eAAO,MAAM,uBAAuB,umTA6SnC,CAAA"}
|
|
@@ -0,0 +1,303 @@
|
|
|
1
|
+
/**
 * Source text of the audio feature-extraction worker, kept as a string.
 *
 * The script is written against a worker-style global `self`: it assigns
 * `self.onmessage` and answers each message with `self.postMessage`.
 *
 * Message payload (`event.data`): `channelData`, `sampleRate`,
 * `pointsPerSecond`, `algorithm`, `bitDepth`, `fullAudioDurationMs`,
 * `numberOfChannels` and an optional `features` flag object.
 *
 * Reply: `{ command: "features", result }` on success, or `{ error }` with
 * the error message when processing throws.
 *
 * NOTE: everything between the backticks is runtime text, including the
 * comments; it must not contain backticks, backslashes or template
 * placeholders.
 */
export const InlineFeaturesExtractor = `

// Unique ID counter (shared by every message handled by this worker instance)
let uniqueIdCounter = 0;

self.onmessage = function (event) {
  const {
    channelData, // this is only the newly recorded data when live recording.
    sampleRate,
    pointsPerSecond,
    algorithm,
    bitDepth,
    fullAudioDurationMs,
    numberOfChannels,
    features: _features,
  } = event.data;

  console.log("[AudioFeaturesExtractor] Worker received message", event.data);
  const features = _features || {};

  const SILENCE_THRESHOLD = 0.01;
  const MIN_SILENCE_DURATION = 1.5 * sampleRate; // 1.5 seconds of silence
  const SPEECH_INERTIA_DURATION = 0.1 * sampleRate; // Speech inertia duration in samples
  const RMS_THRESHOLD = 0.01;
  const ZCR_THRESHOLD = 0.1;

  // NOTE(review): the spectral helpers below operate directly on time-domain
  // samples (no FFT is computed), so their results are rough approximations.

  // Placeholder functions for feature extraction
  const extractMFCC = (segmentData, sampleRate) => {
    // Implement MFCC extraction logic here
    return [];
  };

  const extractSpectralCentroid = (segmentData, sampleRate) => {
    const magnitudeSpectrum = segmentData.map((v) => v * v);
    const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0);
    if (sum === 0) return 0;

    const weightedSum = magnitudeSpectrum.reduce(
      (acc, value, index) => acc + index * value,
      0,
    );
    return ((weightedSum / sum) * (sampleRate / 2)) / magnitudeSpectrum.length;
  };

  const extractSpectralFlatness = (segmentData) => {
    const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));
    // Number.MIN_VALUE keeps Math.log finite for zero-valued samples.
    const geometricMean = Math.exp(
      magnitudeSpectrum
        .map((v) => Math.log(v + Number.MIN_VALUE))
        .reduce((a, b) => a + b, 0) / magnitudeSpectrum.length,
    );
    const arithmeticMean =
      magnitudeSpectrum.reduce((a, b) => a + b, 0) / magnitudeSpectrum.length;
    return arithmeticMean === 0 ? 0 : geometricMean / arithmeticMean;
  };

  const extractSpectralRollOff = (segmentData, sampleRate) => {
    const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));
    const totalEnergy = magnitudeSpectrum.reduce((a, b) => a + b, 0);
    const rollOffThreshold = totalEnergy * 0.85;
    let cumulativeEnergy = 0;

    for (let i = 0; i < magnitudeSpectrum.length; i++) {
      cumulativeEnergy += magnitudeSpectrum[i];
      if (cumulativeEnergy >= rollOffThreshold) {
        return (i / magnitudeSpectrum.length) * (sampleRate / 2);
      }
    }

    return 0;
  };

  const extractSpectralBandwidth = (segmentData, sampleRate) => {
    const centroid = extractSpectralCentroid(segmentData, sampleRate);
    const magnitudeSpectrum = segmentData.map((v) => Math.abs(v));
    const sum = magnitudeSpectrum.reduce((a, b) => a + b, 0);
    if (sum === 0) return 0;

    // NOTE(review): centroid is scaled by sampleRate while index is a raw
    // position, so the two are in different units. Confirm the intended scale.
    const weightedSum = magnitudeSpectrum.reduce(
      (acc, value, index) => acc + value * Math.pow(index - centroid, 2),
      0,
    );
    return Math.sqrt(weightedSum / sum);
  };

  const extractChromagram = (segmentData, sampleRate) => {
    return []; // TODO implement
  };

  const extractHNR = (segmentData) => {
    const frameSize = segmentData.length;
    const autocorrelation = new Float32Array(frameSize);

    // Compute the autocorrelation of the segment data
    for (let i = 0; i < frameSize; i++) {
      let sum = 0;
      for (let j = 0; j < frameSize - i; j++) {
        sum += segmentData[j] * segmentData[j + i];
      }
      autocorrelation[i] = sum;
    }

    // Find the maximum autocorrelation value (excluding the zero lag).
    // A plain loop is used because spreading a long typed array into
    // Math.max can exceed the engine argument limit and throw.
    let maxAutocorrelation = -Infinity;
    for (let lag = 1; lag < frameSize; lag++) {
      if (autocorrelation[lag] > maxAutocorrelation) {
        maxAutocorrelation = autocorrelation[lag];
      }
    }

    // Compute the HNR
    return autocorrelation[0] !== 0
      ? 10 *
          Math.log10(
            maxAutocorrelation / (autocorrelation[0] - maxAutocorrelation),
          )
      : 0;
  };

  const extractWaveform = (
    channelData, // Float32Array
    sampleRate, // number
    pointsPerSecond, // number
    algorithm, // string
  ) => {
    const totalSamples = channelData.length;
    const segmentDuration = totalSamples / sampleRate;
    const dataPoints = [];
    let minAmplitude = Infinity;
    let maxAmplitude = -Infinity;
    let silenceStart = null;
    let lastSpeechEnd = -Infinity;
    let isSpeech = false;

    const expectedPoints = segmentDuration * pointsPerSecond;
    const samplesPerPoint = Math.ceil(channelData.length / expectedPoints);

    for (let i = 0; i < expectedPoints; i++) {
      const start = i * samplesPerPoint;
      // samplesPerPoint is rounded up, so the data can run out before
      // expectedPoints is reached. An empty segment would yield NaN for
      // rms and zcr and poison the amplitude range, so stop here.
      if (start >= totalSamples) {
        break;
      }
      const end = Math.min(start + samplesPerPoint, totalSamples);

      let sumSquares = 0;
      let zeroCrossings = 0;
      let prevValue = channelData[start];
      let localMinAmplitude = Infinity;
      let localMaxAmplitude = -Infinity;
      let hasNonZeroValue = false;

      // compute values for the segment
      for (let j = start; j < end; j++) {
        const value = channelData[j];
        sumSquares += value * value;
        if (j > start && value * prevValue < 0) {
          zeroCrossings++;
        }
        prevValue = value;

        const absValue = Math.abs(value);
        localMinAmplitude = Math.min(localMinAmplitude, absValue);
        localMaxAmplitude = Math.max(localMaxAmplitude, absValue);

        if (absValue !== 0) {
          hasNonZeroValue = true;
        }
      }

      // Post-processing checks
      if (!hasNonZeroValue) {
        // All values are zero
        localMinAmplitude = 0;
        localMaxAmplitude = 0;
      }

      const rms = Math.sqrt(sumSquares / (end - start));
      minAmplitude = Math.min(minAmplitude, rms);
      maxAmplitude = Math.max(maxAmplitude, rms);

      const energy = sumSquares;
      const zcr = zeroCrossings / (end - start);

      const silent = rms < SILENCE_THRESHOLD;
      const dB = 20 * Math.log10(rms);

      if (silent) {
        if (silenceStart === null) {
          silenceStart = start;
        } else if (start - silenceStart > MIN_SILENCE_DURATION) {
          // Silence detected for longer than the threshold, set amplitude to 0
          localMaxAmplitude = 0;
          localMinAmplitude = 0;
          isSpeech = false;
        }
      } else {
        silenceStart = null;
        if (!isSpeech && start - lastSpeechEnd < SPEECH_INERTIA_DURATION) {
          isSpeech = true;
        }
        lastSpeechEnd = end;
      }

      const activeSpeech =
        (rms > RMS_THRESHOLD && zcr > ZCR_THRESHOLD) ||
        (isSpeech && start - lastSpeechEnd < SPEECH_INERTIA_DURATION);

      if (activeSpeech) {
        isSpeech = true;
        lastSpeechEnd = end;
      } else {
        isSpeech = false;
      }

      const bytesPerSample = bitDepth / 8;
      const startPosition = start * bytesPerSample * numberOfChannels; // Calculate start position in bytes
      const endPosition = end * bytesPerSample * numberOfChannels; // Calculate end position in bytes

      // Compute features (each one only when requested through the features flags)
      const segmentData = channelData.slice(start, end);
      const mfcc = features.mfcc ? extractMFCC(segmentData, sampleRate) : [];
      const spectralCentroid = features.spectralCentroid
        ? extractSpectralCentroid(segmentData, sampleRate)
        : 0;
      const spectralFlatness = features.spectralFlatness
        ? extractSpectralFlatness(segmentData)
        : 0;
      const spectralRollOff = features.spectralRollOff
        ? extractSpectralRollOff(segmentData, sampleRate)
        : 0;
      const spectralBandwidth = features.spectralBandwidth
        ? extractSpectralBandwidth(segmentData, sampleRate)
        : 0;
      const chromagram = features.chromagram
        ? extractChromagram(segmentData, sampleRate)
        : [];
      const hnr = features.hnr ? extractHNR(segmentData) : 0;

      const newData = {
        id: uniqueIdCounter++, // Assign unique ID and increment the counter
        amplitude: algorithm === "peak" ? localMaxAmplitude : rms,
        activeSpeech,
        dB,
        silent,
        features: {
          energy,
          rms,
          minAmplitude: localMinAmplitude,
          maxAmplitude: localMaxAmplitude,
          zcr,
          mfcc, // Result of extractMFCC (currently a placeholder returning [])
          spectralCentroid, // Computed spectral centroid
          spectralFlatness, // Computed spectral flatness
          spectralRollOff, // Computed spectral roll-off
          spectralBandwidth, // Computed spectral bandwidth
          chromagram, // Computed chromagram
          hnr, // Computed HNR
        },
        startTime: start / sampleRate,
        endTime: end / sampleRate,
        startPosition,
        endPosition,
        samples: end - start,
        speaker: 0, // Assuming speaker detection is to be handled later
      };

      dataPoints.push(newData);
    }

    return {
      pointsPerSecond,
      durationMs: fullAudioDurationMs,
      bitDepth,
      samples: totalSamples,
      numberOfChannels,
      sampleRate,
      dataPoints,
      amplitudeRange: {
        min: minAmplitude,
        max: maxAmplitude,
      },
      speakerChanges: [], // Placeholder for future speaker detection logic
    };
  };

  try {
    const result = extractWaveform(
      channelData,
      sampleRate,
      pointsPerSecond,
      algorithm,
    );
    self.postMessage({
      command: "features",
      result,
    });
  } catch (error) {
    console.error("[AudioFeaturesExtractor] Error in processing", error);
    self.postMessage({ error: error.message });
  } finally {
    // Do not close the worker so it can be re-used for subsequent messages
    // self.close();
  }
};
`;
|
|
303
|
+
//# sourceMappingURL=InlineFeaturesExtractor.web.js.map
|