@speech-sdk/core 0.8.2-alpha → 0.8.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +56 -3
- package/dist/audio-decode.d.ts +7 -0
- package/dist/audio-decode.d.ts.map +1 -0
- package/dist/audio-decode.js +109 -0
- package/dist/audio-decode.js.map +1 -0
- package/dist/audio-duration.d.ts.map +1 -1
- package/dist/audio-duration.js +3 -12
- package/dist/audio-duration.js.map +1 -1
- package/dist/audio-output.d.ts.map +1 -1
- package/dist/audio-output.js +31 -10
- package/dist/audio-output.js.map +1 -1
- package/dist/audio-utils.d.ts +2 -0
- package/dist/audio-utils.d.ts.map +1 -1
- package/dist/audio-utils.js +55 -1
- package/dist/audio-utils.js.map +1 -1
- package/dist/captions.d.ts.map +1 -1
- package/dist/captions.js +2 -3
- package/dist/captions.js.map +1 -1
- package/dist/conversation/dispatch.d.ts +1 -0
- package/dist/conversation/dispatch.d.ts.map +1 -1
- package/dist/conversation/dispatch.js +2 -2
- package/dist/conversation/dispatch.js.map +1 -1
- package/dist/conversation/pcm-concat.d.ts +0 -1
- package/dist/conversation/pcm-concat.d.ts.map +1 -1
- package/dist/conversation/pcm-concat.js +6 -143
- package/dist/conversation/pcm-concat.js.map +1 -1
- package/dist/conversation/stitch.d.ts +3 -0
- package/dist/conversation/stitch.d.ts.map +1 -1
- package/dist/conversation/stitch.js +10 -2
- package/dist/conversation/stitch.js.map +1 -1
- package/dist/conversation/types.d.ts +6 -2
- package/dist/conversation/types.d.ts.map +1 -1
- package/dist/encoders/mp3.d.ts.map +1 -1
- package/dist/encoders/mp3.js +40 -22
- package/dist/encoders/mp3.js.map +1 -1
- package/dist/errors.d.ts +9 -0
- package/dist/errors.d.ts.map +1 -1
- package/dist/errors.js +20 -0
- package/dist/errors.js.map +1 -1
- package/dist/generate-conversation.d.ts +2 -2
- package/dist/generate-conversation.d.ts.map +1 -1
- package/dist/generate-conversation.js +131 -44
- package/dist/generate-conversation.js.map +1 -1
- package/dist/generate-speech.d.ts +2 -14
- package/dist/generate-speech.d.ts.map +1 -1
- package/dist/generate-speech.js +223 -39
- package/dist/generate-speech.js.map +1 -1
- package/dist/index.d.ts +4 -1
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +2 -1
- package/dist/index.js.map +1 -1
- package/dist/pronunciations/errors.d.ts +5 -0
- package/dist/pronunciations/errors.d.ts.map +1 -0
- package/dist/pronunciations/errors.js +8 -0
- package/dist/pronunciations/errors.js.map +1 -0
- package/dist/pronunciations/index.d.ts +5 -0
- package/dist/pronunciations/index.d.ts.map +1 -0
- package/dist/pronunciations/index.js +5 -0
- package/dist/pronunciations/index.js.map +1 -0
- package/dist/pronunciations/inverse-align.d.ts +4 -0
- package/dist/pronunciations/inverse-align.d.ts.map +1 -0
- package/dist/pronunciations/inverse-align.js +54 -0
- package/dist/pronunciations/inverse-align.js.map +1 -0
- package/dist/pronunciations/merge.d.ts +4 -0
- package/dist/pronunciations/merge.d.ts.map +1 -0
- package/dist/pronunciations/merge.js +13 -0
- package/dist/pronunciations/merge.js.map +1 -0
- package/dist/pronunciations/substitute.d.ts +6 -0
- package/dist/pronunciations/substitute.d.ts.map +1 -0
- package/dist/pronunciations/substitute.js +67 -0
- package/dist/pronunciations/substitute.js.map +1 -0
- package/dist/pronunciations/types.d.ts +18 -0
- package/dist/pronunciations/types.d.ts.map +1 -0
- package/dist/pronunciations/types.js +2 -0
- package/dist/pronunciations/types.js.map +1 -0
- package/dist/pronunciations/validate.d.ts +3 -0
- package/dist/pronunciations/validate.d.ts.map +1 -0
- package/dist/pronunciations/validate.js +26 -0
- package/dist/pronunciations/validate.js.map +1 -0
- package/dist/provider-utils.d.ts +1 -0
- package/dist/provider-utils.d.ts.map +1 -1
- package/dist/provider-utils.js +26 -0
- package/dist/provider-utils.js.map +1 -1
- package/dist/providers/cartesia/index.d.ts +22 -0
- package/dist/providers/cartesia/index.d.ts.map +1 -1
- package/dist/providers/cartesia/index.js +48 -0
- package/dist/providers/cartesia/index.js.map +1 -1
- package/dist/providers/deepgram/index.d.ts +16 -0
- package/dist/providers/deepgram/index.d.ts.map +1 -1
- package/dist/providers/deepgram/index.js +35 -0
- package/dist/providers/deepgram/index.js.map +1 -1
- package/dist/providers/elevenlabs/index.d.ts +7 -0
- package/dist/providers/elevenlabs/index.d.ts.map +1 -1
- package/dist/providers/elevenlabs/index.js +29 -0
- package/dist/providers/elevenlabs/index.js.map +1 -1
- package/dist/providers/fal/index.d.ts +5 -3
- package/dist/providers/fal/index.d.ts.map +1 -1
- package/dist/providers/fal/index.js +14 -7
- package/dist/providers/fal/index.js.map +1 -1
- package/dist/providers/fish-audio/index.d.ts +7 -0
- package/dist/providers/fish-audio/index.d.ts.map +1 -1
- package/dist/providers/fish-audio/index.js +24 -0
- package/dist/providers/fish-audio/index.js.map +1 -1
- package/dist/providers/gateway/index.d.ts +8 -0
- package/dist/providers/gateway/index.d.ts.map +1 -1
- package/dist/providers/gateway/index.js +18 -0
- package/dist/providers/gateway/index.js.map +1 -1
- package/dist/providers/google/index.d.ts +5 -0
- package/dist/providers/google/index.d.ts.map +1 -1
- package/dist/providers/google/index.js +19 -11
- package/dist/providers/google/index.js.map +1 -1
- package/dist/providers/hume/index.d.ts +9 -0
- package/dist/providers/hume/index.d.ts.map +1 -1
- package/dist/providers/hume/index.js +26 -0
- package/dist/providers/hume/index.js.map +1 -1
- package/dist/providers/inworld/index.d.ts +10 -0
- package/dist/providers/inworld/index.d.ts.map +1 -1
- package/dist/providers/inworld/index.js +34 -8
- package/dist/providers/inworld/index.js.map +1 -1
- package/dist/providers/mistral/index.d.ts +7 -0
- package/dist/providers/mistral/index.d.ts.map +1 -1
- package/dist/providers/mistral/index.js +24 -10
- package/dist/providers/mistral/index.js.map +1 -1
- package/dist/providers/murf/index.d.ts +8 -0
- package/dist/providers/murf/index.d.ts.map +1 -1
- package/dist/providers/murf/index.js +40 -1
- package/dist/providers/murf/index.js.map +1 -1
- package/dist/providers/openai/index.d.ts +7 -0
- package/dist/providers/openai/index.d.ts.map +1 -1
- package/dist/providers/openai/index.js +27 -0
- package/dist/providers/openai/index.js.map +1 -1
- package/dist/providers/resemble/index.d.ts +14 -0
- package/dist/providers/resemble/index.d.ts.map +1 -1
- package/dist/providers/resemble/index.js +35 -1
- package/dist/providers/resemble/index.js.map +1 -1
- package/dist/providers/smallest-ai/index.d.ts +47 -0
- package/dist/providers/smallest-ai/index.d.ts.map +1 -0
- package/dist/providers/smallest-ai/index.js +107 -0
- package/dist/providers/smallest-ai/index.js.map +1 -0
- package/dist/providers/xai/index.d.ts +18 -0
- package/dist/providers/xai/index.d.ts.map +1 -1
- package/dist/providers/xai/index.js +27 -0
- package/dist/providers/xai/index.js.map +1 -1
- package/dist/providers.d.ts +2 -0
- package/dist/providers.d.ts.map +1 -1
- package/dist/providers.js +1 -0
- package/dist/providers.js.map +1 -1
- package/dist/retry-options.d.ts +6 -0
- package/dist/retry-options.d.ts.map +1 -0
- package/dist/retry-options.js +48 -0
- package/dist/retry-options.js.map +1 -0
- package/dist/sentence-boundaries.d.ts +3 -0
- package/dist/sentence-boundaries.d.ts.map +1 -0
- package/dist/sentence-boundaries.js +3 -0
- package/dist/sentence-boundaries.js.map +1 -0
- package/dist/speech-provider.d.ts +17 -0
- package/dist/speech-provider.d.ts.map +1 -1
- package/dist/speech-provider.js +4 -0
- package/dist/speech-provider.js.map +1 -1
- package/dist/stream-speech.d.ts +5 -2
- package/dist/stream-speech.d.ts.map +1 -1
- package/dist/stream-speech.js +38 -21
- package/dist/stream-speech.js.map +1 -1
- package/dist/text-chunker.d.ts +13 -0
- package/dist/text-chunker.d.ts.map +1 -0
- package/dist/text-chunker.js +194 -0
- package/dist/text-chunker.js.map +1 -0
- package/dist/types.d.ts +7 -2
- package/dist/types.d.ts.map +1 -1
- package/dist/volume-adjust.d.ts.map +1 -1
- package/dist/volume-adjust.js +4 -10
- package/dist/volume-adjust.js.map +1 -1
- package/package.json +9 -5
- package/NOTICE +0 -27
package/dist/stream-speech.js
CHANGED
|
@@ -1,14 +1,20 @@
|
|
|
1
1
|
import pRetry from "p-retry";
|
|
2
2
|
import { detectAudioTags, stripAudioTags } from "./audio-tags.js";
|
|
3
|
-
import {
|
|
4
|
-
import {
|
|
3
|
+
import { assertGatewayForModerationRulesetId, NoSpeechGeneratedError, StreamingNotSupportedError, } from "./errors.js";
|
|
4
|
+
import { mergeRules } from "./pronunciations/merge.js";
|
|
5
|
+
import { substitute } from "./pronunciations/substitute.js";
|
|
6
|
+
import { validatePronunciationsInput } from "./pronunciations/validate.js";
|
|
5
7
|
import { resolveModel } from "./resolve-provider.js";
|
|
6
|
-
import {
|
|
8
|
+
import { buildRetryOptions } from "./retry-options.js";
|
|
9
|
+
import { FEATURES, hasFeature, isSpeechGatewayModel, } from "./speech-provider.js";
|
|
7
10
|
export async function streamSpeech(options) {
|
|
8
11
|
const { model, voice, providerOptions, abortSignal, headers } = options;
|
|
9
12
|
const maxRetries = options.maxRetries ?? 2;
|
|
10
13
|
const resolved = resolveModel(model, { apiKey: options.apiKey });
|
|
11
14
|
const modelIdentifier = `${resolved.provider.id}/${resolved.modelId}`;
|
|
15
|
+
const isGateway = isSpeechGatewayModel(resolved);
|
|
16
|
+
validatePronunciationsInput(options.pronunciations, isGateway);
|
|
17
|
+
assertGatewayForModerationRulesetId(options.moderationRulesetId, isGateway);
|
|
12
18
|
const modelInfo = resolved.provider.models.find((m) => m.id === resolved.modelId);
|
|
13
19
|
if (modelInfo && !hasFeature(modelInfo, FEATURES.STREAMING)) {
|
|
14
20
|
throw new StreamingNotSupportedError(modelIdentifier);
|
|
@@ -36,30 +42,41 @@ export async function streamSpeech(options) {
|
|
|
36
42
|
? `Text is empty after removing unsupported audio tags for ${modelIdentifier}.`
|
|
37
43
|
: "Text must not be empty.");
|
|
38
44
|
}
|
|
45
|
+
let textToSend = processedText;
|
|
46
|
+
if (!isGateway && options.pronunciations?.rules?.length) {
|
|
47
|
+
const ruleMap = mergeRules(options.pronunciations.rules);
|
|
48
|
+
textToSend = substitute(processedText, ruleMap).text;
|
|
49
|
+
}
|
|
39
50
|
const streamFn = resolved.provider.stream.bind(resolved.provider);
|
|
40
51
|
const startTime = performance.now();
|
|
41
|
-
const result = await pRetry(() =>
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
52
|
+
const result = await pRetry(() => {
|
|
53
|
+
if (isGateway) {
|
|
54
|
+
const gatewayProvider = resolved.provider;
|
|
55
|
+
return gatewayProvider.stream({
|
|
56
|
+
modelId: resolved.modelId,
|
|
57
|
+
text: textToSend,
|
|
58
|
+
voice: voice,
|
|
59
|
+
providerOptions,
|
|
60
|
+
abortSignal,
|
|
61
|
+
headers,
|
|
62
|
+
pronunciations: options.pronunciations,
|
|
63
|
+
moderationRulesetId: options.moderationRulesetId,
|
|
64
|
+
});
|
|
65
|
+
}
|
|
66
|
+
return streamFn({
|
|
67
|
+
modelId: resolved.modelId,
|
|
68
|
+
text: textToSend,
|
|
69
|
+
voice,
|
|
70
|
+
providerOptions,
|
|
71
|
+
abortSignal,
|
|
72
|
+
headers,
|
|
73
|
+
});
|
|
74
|
+
}, buildRetryOptions({ maxRetries, abortSignal }));
|
|
58
75
|
const ttfbMs = Math.round(performance.now() - startTime);
|
|
59
76
|
const metadata = {
|
|
60
77
|
latencyMs: ttfbMs,
|
|
61
78
|
ttfbMs,
|
|
62
|
-
inputChars:
|
|
79
|
+
inputChars: options.text.length,
|
|
63
80
|
...(result.audioDurationMs != null && {
|
|
64
81
|
audioDurationMs: result.audioDurationMs,
|
|
65
82
|
}),
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"stream-speech.js","sourceRoot":"","sources":["../src/stream-speech.ts"],"names":[],"mappings":"AAAA,OAAO,MAAM,MAAM,SAAS,CAAC;AAC7B,OAAO,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,iBAAiB,CAAC;AAClE,OAAO,EACL,
|
|
1
|
+
{"version":3,"file":"stream-speech.js","sourceRoot":"","sources":["../src/stream-speech.ts"],"names":[],"mappings":"AAAA,OAAO,MAAM,MAAM,SAAS,CAAC;AAC7B,OAAO,EAAE,eAAe,EAAE,cAAc,EAAE,MAAM,iBAAiB,CAAC;AAClE,OAAO,EACL,mCAAmC,EACnC,sBAAsB,EACtB,0BAA0B,GAC3B,MAAM,aAAa,CAAC;AAErB,OAAO,EAAE,UAAU,EAAE,MAAM,2BAA2B,CAAC;AACvD,OAAO,EAAE,UAAU,EAAE,MAAM,gCAAgC,CAAC;AAE5D,OAAO,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAE3E,OAAO,EAAE,YAAY,EAAE,MAAM,uBAAuB,CAAC;AACrD,OAAO,EAAE,iBAAiB,EAAE,MAAM,oBAAoB,CAAC;AACvD,OAAO,EACL,QAAQ,EACR,UAAU,EACV,oBAAoB,GAGrB,MAAM,sBAAsB,CAAC;AAG9B,MAAM,CAAC,KAAK,UAAU,YAAY,CAGhC,OAWD;IACC,MAAM,EAAE,KAAK,EAAE,KAAK,EAAE,eAAe,EAAE,WAAW,EAAE,OAAO,EAAE,GAAG,OAAO,CAAC;IACxE,MAAM,UAAU,GAAG,OAAO,CAAC,UAAU,IAAI,CAAC,CAAC;IAE3C,MAAM,QAAQ,GAAG,YAAY,CAAC,KAAK,EAAE,EAAE,MAAM,EAAE,OAAO,CAAC,MAAM,EAAE,CAAC,CAAC;IACjE,MAAM,eAAe,GAAG,GAAG,QAAQ,CAAC,QAAQ,CAAC,EAAE,IAAI,QAAQ,CAAC,OAAO,EAAE,CAAC;IACtE,MAAM,SAAS,GAAG,oBAAoB,CAAC,QAAQ,CAAC,CAAC;IACjD,2BAA2B,CAAC,OAAO,CAAC,cAAc,EAAE,SAAS,CAAC,CAAC;IAC/D,mCAAmC,CAAC,OAAO,CAAC,mBAAmB,EAAE,SAAS,CAAC,CAAC;IAE5E,MAAM,SAAS,GAAG,QAAQ,CAAC,QAAQ,CAAC,MAAM,CAAC,IAAI,CAC7C,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,EAAE,KAAK,QAAQ,CAAC,OAAO,CACjC,CAAC;IACF,IAAI,SAAS,IAAI,CAAC,UAAU,CAAC,SAAS,EAAE,QAAQ,CAAC,SAAS,CAAC,EAAE,CAAC;QAC5D,MAAM,IAAI,0BAA0B,CAAC,eAAe,CAAC,CAAC;IACxD,CAAC;IACD,IAAI,OAAO,QAAQ,CAAC,QAAQ,CAAC,MAAM,KAAK,UAAU,EAAE,CAAC;QACnD,MAAM,IAAI,0BAA0B,CAAC,eAAe,CAAC,CAAC;IACxD,CAAC;IAED,IAAI,aAAqB,CAAC;IAC1B,IAAI,QAAkB,CAAC;IAEvB,IAAI,QAAQ,CAAC,QAAQ,CAAC,gBAAgB,EAAE,CAAC;QACvC,CAAC,EAAE,IAAI,EAAE,aAAa,EAAE,QAAQ,EAAE,GAAG,QAAQ,CAAC,QAAQ,CAAC,gBAAgB,CACrE,OAAO,CAAC,IAAI,EACZ,QAAQ,CAAC,OAAO,CACjB,CAAC,CAAC;IACL,CAAC;SAAM,CAAC;QACN,MAAM,IAAI,GAAG,eAAe,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;QAC3C,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YACpB,CAAC,EAAE,IAAI,EAAE,aAAa,EAAE,QAAQ,EAAE,GAAG,cAAc,CACjD,OAAO,CAAC,IAAI,EACZ,eAAe,CAChB,CAAC,CAAC;QACL,CAAC;aAAM,CAAC;YACN,aAAa,GAAG,OAAO,CAAC,IAAI,CAAC;YAC7B,QAAQ,GAAG,EAAE,CAAC;QAChB,CAAC;IACH,CAAC;IAED,IAAI,aAAa,CAAC,IA
AI,EAAE,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACtC,MAAM,IAAI,sBAAsB,CAC9B,QAAQ,CAAC,MAAM,GAAG,CAAC;YACjB,CAAC,CAAC,2DAA2D,eAAe,GAAG;YAC/E,CAAC,CAAC,yBAAyB,CAC9B,CAAC;IACJ,CAAC;IAED,IAAI,UAAU,GAAG,aAAa,CAAC;IAC/B,IAAI,CAAC,SAAS,IAAI,OAAO,CAAC,cAAc,EAAE,KAAK,EAAE,MAAM,EAAE,CAAC;QACxD,MAAM,OAAO,GAAG,UAAU,CAAC,OAAO,CAAC,cAAc,CAAC,KAAK,CAAC,CAAC;QACzD,UAAU,GAAG,UAAU,CAAC,aAAa,EAAE,OAAO,CAAC,CAAC,IAAI,CAAC;IACvD,CAAC;IAED,MAAM,QAAQ,GAAG,QAAQ,CAAC,QAAQ,CAAC,MAAM,CAAC,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC;IAElE,MAAM,SAAS,GAAG,WAAW,CAAC,GAAG,EAAE,CAAC;IAEpC,MAAM,MAAM,GAAG,MAAM,MAAM,CAAC,GAAG,EAAE;QAC/B,IAAI,SAAS,EAAE,CAAC;YACd,MAAM,eAAe,GAAG,QAAQ,CAAC,QAAiC,CAAC;YACnE,OAAO,eAAe,CAAC,MAAM,CAAC;gBAC5B,OAAO,EAAE,QAAQ,CAAC,OAAO;gBACzB,IAAI,EAAE,UAAU;gBAChB,KAAK,EAAE,KAA0B;gBACjC,eAAe;gBACf,WAAW;gBACX,OAAO;gBACP,cAAc,EAAE,OAAO,CAAC,cAAc;gBACtC,mBAAmB,EAAE,OAAO,CAAC,mBAAmB;aACjD,CAAC,CAAC;QACL,CAAC;QACD,OAAO,QAAQ,CAAC;YACd,OAAO,EAAE,QAAQ,CAAC,OAAO;YACzB,IAAI,EAAE,UAAU;YAChB,KAAK;YACL,eAAe;YACf,WAAW;YACX,OAAO;SACR,CAAC,CAAC;IACL,CAAC,EAAE,iBAAiB,CAAC,EAAE,UAAU,EAAE,WAAW,EAAE,CAAC,CAAC,CAAC;IAEnD,MAAM,MAAM,GAAG,IAAI,CAAC,KAAK,CAAC,WAAW,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC,CAAC;IAEzD,MAAM,QAAQ,GAAmB;QAC/B,SAAS,EAAE,MAAM;QACjB,MAAM;QACN,UAAU,EAAE,OAAO,CAAC,IAAI,CAAC,MAAM;QAC/B,GAAG,CAAC,MAAM,CAAC,eAAe,IAAI,IAAI,IAAI;YACpC,eAAe,EAAE,MAAM,CAAC,eAAe;SACxC,CAAC;KACH,CAAC;IAEF,OAAO;QACL,KAAK,EAAE,MAAM,CAAC,MAAM;QACpB,SAAS,EAAE,MAAM,CAAC,SAAS;QAC3B,QAAQ;QACR,gBAAgB,EAAE,MAAM,CAAC,gBAAgB;QACzC,QAAQ,EAAE,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,SAAS;KACrD,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
export interface MaxInputCharsResolution {
|
|
2
|
+
readonly providerMaxInputChars?: number;
|
|
3
|
+
readonly source?: "provider" | "user";
|
|
4
|
+
readonly userExceedsProvider: boolean;
|
|
5
|
+
readonly userMaxInputChars?: number;
|
|
6
|
+
readonly value?: number;
|
|
7
|
+
}
|
|
8
|
+
export declare function resolveMaxInputChars(args: {
|
|
9
|
+
providerMaxInputChars: number | undefined;
|
|
10
|
+
userMaxInputChars: number | undefined;
|
|
11
|
+
}): MaxInputCharsResolution;
|
|
12
|
+
export declare function splitTextByMaxChars(text: string, maxChars: number): string[];
|
|
13
|
+
//# sourceMappingURL=text-chunker.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"text-chunker.d.ts","sourceRoot":"","sources":["../src/text-chunker.ts"],"names":[],"mappings":"AAeA,MAAM,WAAW,uBAAuB;IACtC,QAAQ,CAAC,qBAAqB,CAAC,EAAE,MAAM,CAAC;IACxC,QAAQ,CAAC,MAAM,CAAC,EAAE,UAAU,GAAG,MAAM,CAAC;IACtC,QAAQ,CAAC,mBAAmB,EAAE,OAAO,CAAC;IACtC,QAAQ,CAAC,iBAAiB,CAAC,EAAE,MAAM,CAAC;IACpC,QAAQ,CAAC,KAAK,CAAC,EAAE,MAAM,CAAC;CACzB;AAED,wBAAgB,oBAAoB,CAAC,IAAI,EAAE;IACzC,qBAAqB,EAAE,MAAM,GAAG,SAAS,CAAC;IAC1C,iBAAiB,EAAE,MAAM,GAAG,SAAS,CAAC;CACvC,GAAG,uBAAuB,CA0B1B;AAED,wBAAgB,mBAAmB,CAAC,IAAI,EAAE,MAAM,EAAE,QAAQ,EAAE,MAAM,GAAG,MAAM,EAAE,CA4C5E"}
|
|
@@ -0,0 +1,194 @@
|
|
|
1
|
+
import { z } from "zod";
|
|
2
|
+
import { SENTENCE_BOUNDARY_RE } from "./sentence-boundaries.js";
|
|
3
|
+
const WHITESPACE_RE = /\s+/g;
|
|
4
|
+
const LEADING_WHITESPACE_RE = /\s/;
|
|
5
|
+
const WHITESPACE_BREAK_PENALTY = 512;
|
|
6
|
+
const MAX_INPUT_CHARS_SCHEMA = z.number().finite().int().positive();
|
|
7
|
+
const MAX_INPUT_CHARS_RESOLUTION_SCHEMA = z.object({
|
|
8
|
+
providerMaxInputChars: MAX_INPUT_CHARS_SCHEMA.optional(),
|
|
9
|
+
userMaxInputChars: MAX_INPUT_CHARS_SCHEMA.optional(),
|
|
10
|
+
});
|
|
11
|
+
const SPLIT_TEXT_OPTIONS_SCHEMA = z.object({
|
|
12
|
+
maxChars: MAX_INPUT_CHARS_SCHEMA,
|
|
13
|
+
});
|
|
14
|
+
export function resolveMaxInputChars(args) {
|
|
15
|
+
const { providerMaxInputChars, userMaxInputChars } = parseWithMessage(MAX_INPUT_CHARS_RESOLUTION_SCHEMA, args, "maxInputChars must be a positive integer.");
|
|
16
|
+
if (userMaxInputChars != null) {
|
|
17
|
+
return {
|
|
18
|
+
providerMaxInputChars,
|
|
19
|
+
source: "user",
|
|
20
|
+
userExceedsProvider: providerMaxInputChars != null &&
|
|
21
|
+
userMaxInputChars > providerMaxInputChars,
|
|
22
|
+
userMaxInputChars,
|
|
23
|
+
value: userMaxInputChars,
|
|
24
|
+
};
|
|
25
|
+
}
|
|
26
|
+
if (providerMaxInputChars != null) {
|
|
27
|
+
return {
|
|
28
|
+
providerMaxInputChars,
|
|
29
|
+
source: "provider",
|
|
30
|
+
userExceedsProvider: false,
|
|
31
|
+
value: providerMaxInputChars,
|
|
32
|
+
};
|
|
33
|
+
}
|
|
34
|
+
return { userExceedsProvider: false };
|
|
35
|
+
}
|
|
36
|
+
export function splitTextByMaxChars(text, maxChars) {
|
|
37
|
+
const { maxChars: resolvedMaxChars } = parseWithMessage(SPLIT_TEXT_OPTIONS_SCHEMA, { maxChars }, "splitTextByMaxChars: maxChars must be a positive integer.");
|
|
38
|
+
const trimmed = text.trim();
|
|
39
|
+
if (trimmed.length <= resolvedMaxChars) {
|
|
40
|
+
return trimmed.length > 0 ? [trimmed] : [];
|
|
41
|
+
}
|
|
42
|
+
const breakCandidates = collectBreakCandidates(trimmed);
|
|
43
|
+
const chunks = [];
|
|
44
|
+
const chunkCount = Math.ceil(trimmed.length / resolvedMaxChars);
|
|
45
|
+
let start = 0;
|
|
46
|
+
for (let chunkIndex = 1; chunkIndex < chunkCount; chunkIndex++) {
|
|
47
|
+
const remainingChunks = chunkCount - chunkIndex;
|
|
48
|
+
const remainingLength = trimmed.length - start;
|
|
49
|
+
const idealEnd = start + Math.round(remainingLength / (remainingChunks + 1));
|
|
50
|
+
const minEnd = Math.max(start + 1, trimmed.length - remainingChunks * resolvedMaxChars);
|
|
51
|
+
const maxEnd = Math.min(start + resolvedMaxChars, trimmed.length - remainingChunks);
|
|
52
|
+
const target = clamp(idealEnd, minEnd, maxEnd);
|
|
53
|
+
const splitIndex = findSplitIndex({ breakCandidates, target, minEnd, maxEnd }) ??
|
|
54
|
+
safeSplitIndex(trimmed, target, minEnd, maxEnd);
|
|
55
|
+
const chunk = trimmed.slice(start, splitIndex).trim();
|
|
56
|
+
if (chunk.length > 0) {
|
|
57
|
+
chunks.push(chunk);
|
|
58
|
+
}
|
|
59
|
+
start = skipLeadingWhitespace(trimmed, splitIndex);
|
|
60
|
+
}
|
|
61
|
+
const finalChunk = trimmed.slice(start).trim();
|
|
62
|
+
if (finalChunk.length > 0) {
|
|
63
|
+
chunks.push(finalChunk);
|
|
64
|
+
}
|
|
65
|
+
return chunks;
|
|
66
|
+
}
|
|
67
|
+
function parseWithMessage(schema, value, message) {
|
|
68
|
+
try {
|
|
69
|
+
return schema.parse(value);
|
|
70
|
+
}
|
|
71
|
+
catch (err) {
|
|
72
|
+
if (err instanceof z.ZodError) {
|
|
73
|
+
throw new Error(message);
|
|
74
|
+
}
|
|
75
|
+
throw err;
|
|
76
|
+
}
|
|
77
|
+
}
|
|
78
|
+
function safeSplitIndex(text, index, minEnd, maxEnd) {
|
|
79
|
+
if (!isSurrogateBoundary(text, index)) {
|
|
80
|
+
return index;
|
|
81
|
+
}
|
|
82
|
+
const candidates = [index + 1, index - 1];
|
|
83
|
+
for (const candidate of candidates) {
|
|
84
|
+
if (candidate >= minEnd &&
|
|
85
|
+
candidate <= maxEnd &&
|
|
86
|
+
!isSurrogateBoundary(text, candidate)) {
|
|
87
|
+
return candidate;
|
|
88
|
+
}
|
|
89
|
+
}
|
|
90
|
+
return (candidates.find((candidate) => !isSurrogateBoundary(text, candidate)) ??
|
|
91
|
+
index);
|
|
92
|
+
}
|
|
93
|
+
function isSurrogateBoundary(text, index) {
|
|
94
|
+
if (index <= 0 || index >= text.length) {
|
|
95
|
+
return false;
|
|
96
|
+
}
|
|
97
|
+
const before = text.charCodeAt(index - 1);
|
|
98
|
+
const after = text.charCodeAt(index);
|
|
99
|
+
return (before >= 0xd8_00 &&
|
|
100
|
+
before <= 0xdb_ff &&
|
|
101
|
+
after >= 0xdc_00 &&
|
|
102
|
+
after <= 0xdf_ff);
|
|
103
|
+
}
|
|
104
|
+
function collectBreakCandidates(text) {
|
|
105
|
+
return {
|
|
106
|
+
paragraph: collectLiteralBreaks(text, "\n\n"),
|
|
107
|
+
line: collectLiteralBreaks(text, "\n"),
|
|
108
|
+
sentence: collectRegexBreaks(text, SENTENCE_BOUNDARY_RE),
|
|
109
|
+
whitespace: collectRegexBreaks(text, WHITESPACE_RE),
|
|
110
|
+
};
|
|
111
|
+
}
|
|
112
|
+
function collectLiteralBreaks(text, literal) {
|
|
113
|
+
const breaks = [];
|
|
114
|
+
let index = text.indexOf(literal);
|
|
115
|
+
while (index !== -1) {
|
|
116
|
+
breaks.push(index + literal.length);
|
|
117
|
+
index = text.indexOf(literal, index + literal.length);
|
|
118
|
+
}
|
|
119
|
+
return breaks;
|
|
120
|
+
}
|
|
121
|
+
function collectRegexBreaks(text, regex) {
|
|
122
|
+
const breaks = [];
|
|
123
|
+
regex.lastIndex = 0;
|
|
124
|
+
let match = regex.exec(text);
|
|
125
|
+
while (match) {
|
|
126
|
+
breaks.push(match.index + match[0].length);
|
|
127
|
+
if (match[0].length === 0) {
|
|
128
|
+
regex.lastIndex++;
|
|
129
|
+
}
|
|
130
|
+
match = regex.exec(text);
|
|
131
|
+
}
|
|
132
|
+
return breaks;
|
|
133
|
+
}
|
|
134
|
+
function findSplitIndex(args) {
|
|
135
|
+
let best;
|
|
136
|
+
const candidateGroups = [
|
|
137
|
+
{ breaks: args.breakCandidates.paragraph, penalty: 0 },
|
|
138
|
+
{ breaks: args.breakCandidates.line, penalty: 16 },
|
|
139
|
+
{ breaks: args.breakCandidates.sentence, penalty: 32 },
|
|
140
|
+
{
|
|
141
|
+
breaks: args.breakCandidates.whitespace,
|
|
142
|
+
penalty: WHITESPACE_BREAK_PENALTY,
|
|
143
|
+
},
|
|
144
|
+
];
|
|
145
|
+
for (const group of candidateGroups) {
|
|
146
|
+
for (const index of nearestCandidates(group.breaks, args.target)) {
|
|
147
|
+
if (index < args.minEnd || index > args.maxEnd) {
|
|
148
|
+
continue;
|
|
149
|
+
}
|
|
150
|
+
const score = Math.abs(index - args.target) + group.penalty;
|
|
151
|
+
if (!best || score < best.score) {
|
|
152
|
+
best = { index, score };
|
|
153
|
+
}
|
|
154
|
+
}
|
|
155
|
+
}
|
|
156
|
+
return best?.index;
|
|
157
|
+
}
|
|
158
|
+
function nearestCandidates(breaks, target) {
|
|
159
|
+
const upper = lowerBound(breaks, target);
|
|
160
|
+
const candidates = [];
|
|
161
|
+
const lower = upper - 1;
|
|
162
|
+
if (lower >= 0) {
|
|
163
|
+
candidates.push(breaks[lower] ?? 0);
|
|
164
|
+
}
|
|
165
|
+
if (upper < breaks.length) {
|
|
166
|
+
candidates.push(breaks[upper] ?? 0);
|
|
167
|
+
}
|
|
168
|
+
return candidates;
|
|
169
|
+
}
|
|
170
|
+
function lowerBound(values, target) {
|
|
171
|
+
let low = 0;
|
|
172
|
+
let high = values.length;
|
|
173
|
+
while (low < high) {
|
|
174
|
+
const mid = Math.floor((low + high) / 2);
|
|
175
|
+
if ((values[mid] ?? 0) < target) {
|
|
176
|
+
low = mid + 1;
|
|
177
|
+
}
|
|
178
|
+
else {
|
|
179
|
+
high = mid;
|
|
180
|
+
}
|
|
181
|
+
}
|
|
182
|
+
return low;
|
|
183
|
+
}
|
|
184
|
+
function clamp(value, min, max) {
|
|
185
|
+
return Math.min(Math.max(value, min), max);
|
|
186
|
+
}
|
|
187
|
+
function skipLeadingWhitespace(text, index) {
|
|
188
|
+
let next = index;
|
|
189
|
+
while (next < text.length && LEADING_WHITESPACE_RE.test(text[next] ?? "")) {
|
|
190
|
+
next++;
|
|
191
|
+
}
|
|
192
|
+
return next;
|
|
193
|
+
}
|
|
194
|
+
//# sourceMappingURL=text-chunker.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"text-chunker.js","sourceRoot":"","sources":["../src/text-chunker.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,CAAC,EAAE,MAAM,KAAK,CAAC;AACxB,OAAO,EAAE,oBAAoB,EAAE,MAAM,0BAA0B,CAAC;AAEhE,MAAM,aAAa,GAAG,MAAM,CAAC;AAC7B,MAAM,qBAAqB,GAAG,IAAI,CAAC;AACnC,MAAM,wBAAwB,GAAG,GAAG,CAAC;AACrC,MAAM,sBAAsB,GAAG,CAAC,CAAC,MAAM,EAAE,CAAC,MAAM,EAAE,CAAC,GAAG,EAAE,CAAC,QAAQ,EAAE,CAAC;AACpE,MAAM,iCAAiC,GAAG,CAAC,CAAC,MAAM,CAAC;IACjD,qBAAqB,EAAE,sBAAsB,CAAC,QAAQ,EAAE;IACxD,iBAAiB,EAAE,sBAAsB,CAAC,QAAQ,EAAE;CACrD,CAAC,CAAC;AACH,MAAM,yBAAyB,GAAG,CAAC,CAAC,MAAM,CAAC;IACzC,QAAQ,EAAE,sBAAsB;CACjC,CAAC,CAAC;AAUH,MAAM,UAAU,oBAAoB,CAAC,IAGpC;IACC,MAAM,EAAE,qBAAqB,EAAE,iBAAiB,EAAE,GAAG,gBAAgB,CACnE,iCAAiC,EACjC,IAAI,EACJ,2CAA2C,CAC5C,CAAC;IACF,IAAI,iBAAiB,IAAI,IAAI,EAAE,CAAC;QAC9B,OAAO;YACL,qBAAqB;YACrB,MAAM,EAAE,MAAM;YACd,mBAAmB,EACjB,qBAAqB,IAAI,IAAI;gBAC7B,iBAAiB,GAAG,qBAAqB;YAC3C,iBAAiB;YACjB,KAAK,EAAE,iBAAiB;SACzB,CAAC;IACJ,CAAC;IACD,IAAI,qBAAqB,IAAI,IAAI,EAAE,CAAC;QAClC,OAAO;YACL,qBAAqB;YACrB,MAAM,EAAE,UAAU;YAClB,mBAAmB,EAAE,KAAK;YAC1B,KAAK,EAAE,qBAAqB;SAC7B,CAAC;IACJ,CAAC;IACD,OAAO,EAAE,mBAAmB,EAAE,KAAK,EAAE,CAAC;AACxC,CAAC;AAED,MAAM,UAAU,mBAAmB,CAAC,IAAY,EAAE,QAAgB;IAChE,MAAM,EAAE,QAAQ,EAAE,gBAAgB,EAAE,GAAG,gBAAgB,CACrD,yBAAyB,EACzB,EAAE,QAAQ,EAAE,EACZ,2DAA2D,CAC5D,CAAC;IACF,MAAM,OAAO,GAAG,IAAI,CAAC,IAAI,EAAE,CAAC;IAC5B,IAAI,OAAO,CAAC,MAAM,IAAI,gBAAgB,EAAE,CAAC;QACvC,OAAO,OAAO,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;IAC7C,CAAC;IAED,MAAM,eAAe,GAAG,sBAAsB,CAAC,OAAO,CAAC,CAAC;IACxD,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,MAAM,UAAU,GAAG,IAAI,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,GAAG,gBAAgB,CAAC,CAAC;IAChE,IAAI,KAAK,GAAG,CAAC,CAAC;IAEd,KAAK,IAAI,UAAU,GAAG,CAAC,EAAE,UAAU,GAAG,UAAU,EAAE,UAAU,EAAE,EAAE,CAAC;QAC/D,MAAM,eAAe,GAAG,UAAU,GAAG,UAAU,CAAC;QAChD,MAAM,eAAe,GAAG,OAAO,CAAC,MAAM,GAAG,KAAK,CAAC;QAC/C,MAAM,QAAQ,GACZ,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,eAAe,GAAG,CAAC,eAAe,GAAG,CAAC,CAAC,CAAC,CAAC;QAC9D,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,CACrB,KAAK,GAAG,CAAC,EACT,OAA
O,CAAC,MAAM,GAAG,eAAe,GAAG,gBAAgB,CACpD,CAAC;QACF,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,CACrB,KAAK,GAAG,gBAAgB,EACxB,OAAO,CAAC,MAAM,GAAG,eAAe,CACjC,CAAC;QACF,MAAM,MAAM,GAAG,KAAK,CAAC,QAAQ,EAAE,MAAM,EAAE,MAAM,CAAC,CAAC;QAC/C,MAAM,UAAU,GACd,cAAc,CAAC,EAAE,eAAe,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,CAAC;YAC3D,cAAc,CAAC,OAAO,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,CAAC,CAAC;QAClD,MAAM,KAAK,GAAG,OAAO,CAAC,KAAK,CAAC,KAAK,EAAE,UAAU,CAAC,CAAC,IAAI,EAAE,CAAC;QACtD,IAAI,KAAK,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YACrB,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QACrB,CAAC;QACD,KAAK,GAAG,qBAAqB,CAAC,OAAO,EAAE,UAAU,CAAC,CAAC;IACrD,CAAC;IACD,MAAM,UAAU,GAAG,OAAO,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,IAAI,EAAE,CAAC;IAC/C,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC1B,MAAM,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC;IAC1B,CAAC;IACD,OAAO,MAAM,CAAC;AAChB,CAAC;AAED,SAAS,gBAAgB,CACvB,MAAoB,EACpB,KAAc,EACd,OAAe;IAEf,IAAI,CAAC;QACH,OAAO,MAAM,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;IAC7B,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,IAAI,GAAG,YAAY,CAAC,CAAC,QAAQ,EAAE,CAAC;YAC9B,MAAM,IAAI,KAAK,CAAC,OAAO,CAAC,CAAC;QAC3B,CAAC;QACD,MAAM,GAAG,CAAC;IACZ,CAAC;AACH,CAAC;AAED,SAAS,cAAc,CACrB,IAAY,EACZ,KAAa,EACb,MAAc,EACd,MAAc;IAEd,IAAI,CAAC,mBAAmB,CAAC,IAAI,EAAE,KAAK,CAAC,EAAE,CAAC;QACtC,OAAO,KAAK,CAAC;IACf,CAAC;IAED,MAAM,UAAU,GAAG,CAAC,KAAK,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC,CAAC,CAAC;IAC1C,KAAK,MAAM,SAAS,IAAI,UAAU,EAAE,CAAC;QACnC,IACE,SAAS,IAAI,MAAM;YACnB,SAAS,IAAI,MAAM;YACnB,CAAC,mBAAmB,CAAC,IAAI,EAAE,SAAS,CAAC,EACrC,CAAC;YACD,OAAO,SAAS,CAAC;QACnB,CAAC;IACH,CAAC;IAED,OAAO,CACL,UAAU,CAAC,IAAI,CAAC,CAAC,SAAS,EAAE,EAAE,CAAC,CAAC,mBAAmB,CAAC,IAAI,EAAE,SAAS,CAAC,CAAC;QACrE,KAAK,CACN,CAAC;AACJ,CAAC;AAED,SAAS,mBAAmB,CAAC,IAAY,EAAE,KAAa;IACtD,IAAI,KAAK,IAAI,CAAC,IAAI,KAAK,IAAI,IAAI,CAAC,MAAM,EAAE,CAAC;QACvC,OAAO,KAAK,CAAC;IACf,CAAC;IACD,MAAM,MAAM,GAAG,IAAI,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;IAC1C,MAAM,KAAK,GAAG,IAAI,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;IACrC,OAAO,CACL,MAAM,IAAI,OAAO;QACjB,MAAM,IAAI,OAAO;QACjB,KAAK,IAAI,OAAO;QAChB,KAAK,IAAI,OAAO,CACjB,CAAC;AACJ,CAAC;AASD,SAAS,sBAAsB,CAAC,IA
AY;IAC1C,OAAO;QACL,SAAS,EAAE,oBAAoB,CAAC,IAAI,EAAE,MAAM,CAAC;QAC7C,IAAI,EAAE,oBAAoB,CAAC,IAAI,EAAE,IAAI,CAAC;QACtC,QAAQ,EAAE,kBAAkB,CAAC,IAAI,EAAE,oBAAoB,CAAC;QACxD,UAAU,EAAE,kBAAkB,CAAC,IAAI,EAAE,aAAa,CAAC;KACpD,CAAC;AACJ,CAAC;AAED,SAAS,oBAAoB,CAAC,IAAY,EAAE,OAAe;IACzD,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,IAAI,KAAK,GAAG,IAAI,CAAC,OAAO,CAAC,OAAO,CAAC,CAAC;IAClC,OAAO,KAAK,KAAK,CAAC,CAAC,EAAE,CAAC;QACpB,MAAM,CAAC,IAAI,CAAC,KAAK,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;QACpC,KAAK,GAAG,IAAI,CAAC,OAAO,CAAC,OAAO,EAAE,KAAK,GAAG,OAAO,CAAC,MAAM,CAAC,CAAC;IACxD,CAAC;IACD,OAAO,MAAM,CAAC;AAChB,CAAC;AAED,SAAS,kBAAkB,CAAC,IAAY,EAAE,KAAa;IACrD,MAAM,MAAM,GAAa,EAAE,CAAC;IAC5B,KAAK,CAAC,SAAS,GAAG,CAAC,CAAC;IACpB,IAAI,KAAK,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC7B,OAAO,KAAK,EAAE,CAAC;QACb,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC;QAC3C,IAAI,KAAK,CAAC,CAAC,CAAC,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YAC1B,KAAK,CAAC,SAAS,EAAE,CAAC;QACpB,CAAC;QACD,KAAK,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAC3B,CAAC;IACD,OAAO,MAAM,CAAC;AAChB,CAAC;AAED,SAAS,cAAc,CAAC,IAKvB;IACC,IAAI,IAAkD,CAAC;IACvD,MAAM,eAAe,GAAG;QACtB,EAAE,MAAM,EAAE,IAAI,CAAC,eAAe,CAAC,SAAS,EAAE,OAAO,EAAE,CAAC,EAAE;QACtD,EAAE,MAAM,EAAE,IAAI,CAAC,eAAe,CAAC,IAAI,EAAE,OAAO,EAAE,EAAE,EAAE;QAClD,EAAE,MAAM,EAAE,IAAI,CAAC,eAAe,CAAC,QAAQ,EAAE,OAAO,EAAE,EAAE,EAAE;QACtD;YACE,MAAM,EAAE,IAAI,CAAC,eAAe,CAAC,UAAU;YACvC,OAAO,EAAE,wBAAwB;SAClC;KACO,CAAC;IAEX,KAAK,MAAM,KAAK,IAAI,eAAe,EAAE,CAAC;QACpC,KAAK,MAAM,KAAK,IAAI,iBAAiB,CAAC,KAAK,CAAC,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,EAAE,CAAC;YACjE,IAAI,KAAK,GAAG,IAAI,CAAC,MAAM,IAAI,KAAK,GAAG,IAAI,CAAC,MAAM,EAAE,CAAC;gBAC/C,SAAS;YACX,CAAC;YACD,MAAM,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,KAAK,GAAG,IAAI,CAAC,MAAM,CAAC,GAAG,KAAK,CAAC,OAAO,CAAC;YAC5D,IAAI,CAAC,IAAI,IAAI,KAAK,GAAG,IAAI,CAAC,KAAK,EAAE,CAAC;gBAChC,IAAI,GAAG,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC;YAC1B,CAAC;QACH,CAAC;IACH,CAAC;IACD,OAAO,IAAI,EAAE,KAAK,CAAC;AACrB,CAAC;AAED,SAAS,iBAAiB,CACxB,MAAyB,EACzB,MAAc;IAEd,MAAM,KAAK,GAAG,UAAU,CAAC,MAAM,EAAE,MAAM,CAAC,
CAAC;IACzC,MAAM,UAAU,GAAa,EAAE,CAAC;IAChC,MAAM,KAAK,GAAG,KAAK,GAAG,CAAC,CAAC;IACxB,IAAI,KAAK,IAAI,CAAC,EAAE,CAAC;QACf,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC;IACtC,CAAC;IACD,IAAI,KAAK,GAAG,MAAM,CAAC,MAAM,EAAE,CAAC;QAC1B,UAAU,CAAC,IAAI,CAAC,MAAM,CAAC,KAAK,CAAC,IAAI,CAAC,CAAC,CAAC;IACtC,CAAC;IACD,OAAO,UAAU,CAAC;AACpB,CAAC;AAED,SAAS,UAAU,CAAC,MAAyB,EAAE,MAAc;IAC3D,IAAI,GAAG,GAAG,CAAC,CAAC;IACZ,IAAI,IAAI,GAAG,MAAM,CAAC,MAAM,CAAC;IACzB,OAAO,GAAG,GAAG,IAAI,EAAE,CAAC;QAClB,MAAM,GAAG,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC;QACzC,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,GAAG,MAAM,EAAE,CAAC;YAChC,GAAG,GAAG,GAAG,GAAG,CAAC,CAAC;QAChB,CAAC;aAAM,CAAC;YACN,IAAI,GAAG,GAAG,CAAC;QACb,CAAC;IACH,CAAC;IACD,OAAO,GAAG,CAAC;AACb,CAAC;AAED,SAAS,KAAK,CAAC,KAAa,EAAE,GAAW,EAAE,GAAW;IACpD,OAAO,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,GAAG,CAAC,KAAK,EAAE,GAAG,CAAC,EAAE,GAAG,CAAC,CAAC;AAC7C,CAAC;AAED,SAAS,qBAAqB,CAAC,IAAY,EAAE,KAAa;IACxD,IAAI,IAAI,GAAG,KAAK,CAAC;IACjB,OAAO,IAAI,GAAG,IAAI,CAAC,MAAM,IAAI,qBAAqB,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,EAAE,CAAC,EAAE,CAAC;QAC1E,IAAI,EAAE,CAAC;IACT,CAAC;IACD,OAAO,IAAI,CAAC;AACd,CAAC"}
|
package/dist/types.d.ts
CHANGED
|
@@ -1,9 +1,11 @@
|
|
|
1
1
|
import type { AudioOutput } from "./audio-output.js";
|
|
2
|
+
import type { PronunciationsFor } from "./pronunciations/types.js";
|
|
2
3
|
import type { ResolvedModel, Voice } from "./speech-provider.js";
|
|
3
4
|
export type { AudioOutput, AudioOutputFormat } from "./audio-output.js";
|
|
4
5
|
export type { CaptionFormat, CaptionsOptions } from "./captions.js";
|
|
5
6
|
export type { ConversationTurn, GenerateConversationOptions, } from "./conversation/types.js";
|
|
6
7
|
export type { SpeechMetadata } from "./metadata.js";
|
|
8
|
+
export type { Pronunciation, PronunciationsInput, } from "./pronunciations/types.js";
|
|
7
9
|
export type { CartesiaSpeechProviderConfig } from "./providers/cartesia/index.js";
|
|
8
10
|
export type { DeepgramSpeechProviderConfig } from "./providers/deepgram/index.js";
|
|
9
11
|
export type { ElevenLabsSpeechProviderConfig } from "./providers/elevenlabs/index.js";
|
|
@@ -24,13 +26,16 @@ export type { ResolvedSTTModel, SpeechToTextProvider, STTModelInfo, } from "./sp
|
|
|
24
26
|
export type { StreamSpeechResult } from "./stream-speech-result.js";
|
|
25
27
|
export type { ConversationWordTimestamp, WordTimestamp, } from "./timestamps.js";
|
|
26
28
|
export type { TurnTimestamp } from "./turns.js";
|
|
27
|
-
export interface GenerateSpeechOptions<V extends Voice = Voice> {
|
|
29
|
+
export interface GenerateSpeechOptions<V extends Voice = Voice, M extends string | ResolvedModel<V> = string | ResolvedModel<V>> {
|
|
28
30
|
abortSignal?: AbortSignal;
|
|
29
31
|
apiKey?: string;
|
|
30
32
|
headers?: Record<string, string>;
|
|
33
|
+
maxInputChars?: number;
|
|
31
34
|
maxRetries?: number;
|
|
32
|
-
model: string | ResolvedModel<V>;
|
|
35
|
+
model: M;
|
|
36
|
+
moderationRulesetId?: string;
|
|
33
37
|
output?: AudioOutput;
|
|
38
|
+
pronunciations?: PronunciationsFor<M>;
|
|
34
39
|
providerOptions?: Record<string, unknown>;
|
|
35
40
|
text: string;
|
|
36
41
|
timestamps?: boolean;
|
package/dist/types.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AACrD,OAAO,KAAK,EAAE,aAAa,EAAE,KAAK,EAAE,MAAM,sBAAsB,CAAC;AAEjE,YAAY,EAAE,WAAW,EAAE,iBAAiB,EAAE,MAAM,mBAAmB,CAAC;AACxE,YAAY,EAAE,aAAa,EAAE,eAAe,EAAE,MAAM,eAAe,CAAC;AACpE,YAAY,EACV,gBAAgB,EAChB,2BAA2B,GAC5B,MAAM,yBAAyB,CAAC;AACjC,YAAY,EAAE,cAAc,EAAE,MAAM,eAAe,CAAC;AACpD,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,8BAA8B,EAAE,MAAM,iCAAiC,CAAC;AACtF,YAAY,EAAE,uBAAuB,EAAE,MAAM,0BAA0B,CAAC;AACxE,YAAY,EAAE,6BAA6B,EAAE,MAAM,iCAAiC,CAAC;AACrF,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,0BAA0B,EAAE,MAAM,6BAA6B,CAAC;AAC9E,YAAY,EAAE,wBAAwB,EAAE,MAAM,2BAA2B,CAAC;AAC1E,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,wBAAwB,EAAE,MAAM,2BAA2B,CAAC;AAC1E,YAAY,EAAE,0BAA0B,EAAE,MAAM,6BAA6B,CAAC;AAC9E,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,uBAAuB,EAAE,MAAM,0BAA0B,CAAC;AACxE,YAAY,EACV,OAAO,EACP,SAAS,EACT,aAAa,EACb,cAAc,EACd,KAAK,GACN,MAAM,sBAAsB,CAAC;AAC9B,YAAY,EACV,kBAAkB,EAClB,kBAAkB,EAClB,YAAY,GACb,MAAM,oBAAoB,CAAC;AAC5B,YAAY,EACV,gBAAgB,EAChB,oBAAoB,EACpB,YAAY,GACb,MAAM,8BAA8B,CAAC;AACtC,YAAY,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AACpE,YAAY,EACV,yBAAyB,EACzB,aAAa,GACd,MAAM,iBAAiB,CAAC;AACzB,YAAY,EAAE,aAAa,EAAE,MAAM,YAAY,CAAC;AAEhD,MAAM,WAAW,qBAAqB,
|
|
1
|
+
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,WAAW,EAAE,MAAM,mBAAmB,CAAC;AACrD,OAAO,KAAK,EAAE,iBAAiB,EAAE,MAAM,2BAA2B,CAAC;AACnE,OAAO,KAAK,EAAE,aAAa,EAAE,KAAK,EAAE,MAAM,sBAAsB,CAAC;AAEjE,YAAY,EAAE,WAAW,EAAE,iBAAiB,EAAE,MAAM,mBAAmB,CAAC;AACxE,YAAY,EAAE,aAAa,EAAE,eAAe,EAAE,MAAM,eAAe,CAAC;AACpE,YAAY,EACV,gBAAgB,EAChB,2BAA2B,GAC5B,MAAM,yBAAyB,CAAC;AACjC,YAAY,EAAE,cAAc,EAAE,MAAM,eAAe,CAAC;AACpD,YAAY,EACV,aAAa,EACb,mBAAmB,GACpB,MAAM,2BAA2B,CAAC;AACnC,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,8BAA8B,EAAE,MAAM,iCAAiC,CAAC;AACtF,YAAY,EAAE,uBAAuB,EAAE,MAAM,0BAA0B,CAAC;AACxE,YAAY,EAAE,6BAA6B,EAAE,MAAM,iCAAiC,CAAC;AACrF,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,0BAA0B,EAAE,MAAM,6BAA6B,CAAC;AAC9E,YAAY,EAAE,wBAAwB,EAAE,MAAM,2BAA2B,CAAC;AAC1E,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,2BAA2B,EAAE,MAAM,8BAA8B,CAAC;AAChF,YAAY,EAAE,wBAAwB,EAAE,MAAM,2BAA2B,CAAC;AAC1E,YAAY,EAAE,0BAA0B,EAAE,MAAM,6BAA6B,CAAC;AAC9E,YAAY,EAAE,4BAA4B,EAAE,MAAM,+BAA+B,CAAC;AAClF,YAAY,EAAE,uBAAuB,EAAE,MAAM,0BAA0B,CAAC;AACxE,YAAY,EACV,OAAO,EACP,SAAS,EACT,aAAa,EACb,cAAc,EACd,KAAK,GACN,MAAM,sBAAsB,CAAC;AAC9B,YAAY,EACV,kBAAkB,EAClB,kBAAkB,EAClB,YAAY,GACb,MAAM,oBAAoB,CAAC;AAC5B,YAAY,EACV,gBAAgB,EAChB,oBAAoB,EACpB,YAAY,GACb,MAAM,8BAA8B,CAAC;AACtC,YAAY,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AACpE,YAAY,EACV,yBAAyB,EACzB,aAAa,GACd,MAAM,iBAAiB,CAAC;AACzB,YAAY,EAAE,aAAa,EAAE,MAAM,YAAY,CAAC;AAEhD,MAAM,WAAW,qBAAqB,CACpC,CAAC,SAAS,KAAK,GAAG,KAAK,EACvB,CAAC,SAAS,MAAM,GAAG,aAAa,CAAC,CAAC,CAAC,GAAG,MAAM,GAAG,aAAa,CAAC,CAAC,CAAC;IAE/D,WAAW,CAAC,EAAE,WAAW,CAAC;IAC1B,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IACjC,aAAa,CAAC,EAAE,MAAM,CAAC;IACvB,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,KAAK,EAAE,CAAC,CAAC;IAET,mBAAmB,CAAC,EAAE,MAAM,CAAC;IAC7B,MAAM,CAAC,EAAE,WAAW,CAAC;IACrB,cAAc,CAAC,EAAE,iBAAiB,CAAC,CAAC,CAAC,CAAC;IACtC,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,
EAAE,OAAO,CAAC,CAAC;IAC1C,IAAI,EAAE,MAAM,CAAC;IACb,UAAU,CAAC,EAAE,OAAO,CAAC;IACrB,KAAK,EAAE,CAAC,CAAC;IACT,UAAU,CAAC,EAAE,MAAM,CAAC;CACrB"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"volume-adjust.d.ts","sourceRoot":"","sources":["../src/volume-adjust.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"volume-adjust.d.ts","sourceRoot":"","sources":["../src/volume-adjust.ts"],"names":[],"mappings":"AAQA,UAAU,iBAAiB;IACzB,QAAQ,CAAC,KAAK,EAAE,MAAM,GAAG,UAAU,CAAC;IACpC,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;IAC3B,QAAQ,CAAC,UAAU,EAAE,MAAM,CAAC;CAC7B;AAED,wBAAsB,YAAY,CAChC,KAAK,EAAE,iBAAiB,GACvB,OAAO,CAAC,UAAU,CAAC,CAgBrB"}
|
package/dist/volume-adjust.js
CHANGED
|
@@ -1,21 +1,15 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { decodeAudioToPcm16 } from "./audio-decode.js";
|
|
2
|
+
import { base64ToUint8Array } from "./audio-utils.js";
|
|
3
|
+
import { concatPcmToWav, dbfsToInt16Rms, normalizeRms, } from "./conversation/pcm-concat.js";
|
|
2
4
|
export async function adjustVolume(input) {
|
|
3
5
|
const bytes = input.audio instanceof Uint8Array
|
|
4
6
|
? input.audio
|
|
5
7
|
: base64ToUint8Array(input.audio);
|
|
6
|
-
const segment =
|
|
8
|
+
const segment = await decodeAudioToPcm16(bytes, input.mediaType);
|
|
7
9
|
const [normalized] = normalizeRms([segment], dbfsToInt16Rms(input.volumeDbfs));
|
|
8
10
|
return await concatPcmToWav([normalized], {
|
|
9
11
|
gapMs: 0,
|
|
10
12
|
targetSampleRate: normalized.sampleRate,
|
|
11
13
|
});
|
|
12
14
|
}
|
|
13
|
-
function base64ToUint8Array(b64) {
|
|
14
|
-
const binaryString = atob(b64);
|
|
15
|
-
const out = new Uint8Array(binaryString.length);
|
|
16
|
-
for (let i = 0; i < binaryString.length; i++) {
|
|
17
|
-
out[i] = binaryString.charCodeAt(i);
|
|
18
|
-
}
|
|
19
|
-
return out;
|
|
20
|
-
}
|
|
21
15
|
//# sourceMappingURL=volume-adjust.js.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"volume-adjust.js","sourceRoot":"","sources":["../src/volume-adjust.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,cAAc,EACd,cAAc,EACd,
|
|
1
|
+
{"version":3,"file":"volume-adjust.js","sourceRoot":"","sources":["../src/volume-adjust.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,kBAAkB,EAAE,MAAM,mBAAmB,CAAC;AACvD,OAAO,EAAE,kBAAkB,EAAE,MAAM,kBAAkB,CAAC;AACtD,OAAO,EACL,cAAc,EACd,cAAc,EACd,YAAY,GACb,MAAM,8BAA8B,CAAC;AAQtC,MAAM,CAAC,KAAK,UAAU,YAAY,CAChC,KAAwB;IAExB,MAAM,KAAK,GACT,KAAK,CAAC,KAAK,YAAY,UAAU;QAC/B,CAAC,CAAC,KAAK,CAAC,KAAK;QACb,CAAC,CAAC,kBAAkB,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;IAEtC,MAAM,OAAO,GAAG,MAAM,kBAAkB,CAAC,KAAK,EAAE,KAAK,CAAC,SAAS,CAAC,CAAC;IACjE,MAAM,CAAC,UAAU,CAAC,GAAG,YAAY,CAC/B,CAAC,OAAO,CAAC,EACT,cAAc,CAAC,KAAK,CAAC,UAAU,CAAC,CACjC,CAAC;IAEF,OAAO,MAAM,cAAc,CAAC,CAAC,UAAU,CAAC,EAAE;QACxC,KAAK,EAAE,CAAC;QACR,gBAAgB,EAAE,UAAU,CAAC,UAAU;KACxC,CAAC,CAAC;AACL,CAAC"}
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@speech-sdk/core",
|
|
3
|
-
"version": "0.8.2
|
|
3
|
+
"version": "0.8.2",
|
|
4
4
|
"description": "Universal, cross-platform text-to-speech SDK with multi-provider support.",
|
|
5
5
|
"type": "module",
|
|
6
6
|
"main": "./dist/index.js",
|
|
@@ -17,13 +17,17 @@
|
|
|
17
17
|
"./types": {
|
|
18
18
|
"types": "./dist/types.d.ts",
|
|
19
19
|
"default": "./dist/types.js"
|
|
20
|
+
},
|
|
21
|
+
"./pronunciations": {
|
|
22
|
+
"types": "./dist/pronunciations/index.d.ts",
|
|
23
|
+
"default": "./dist/pronunciations/index.js"
|
|
20
24
|
}
|
|
21
25
|
},
|
|
22
26
|
"files": [
|
|
23
27
|
"dist",
|
|
24
|
-
"README.md"
|
|
25
|
-
"NOTICE"
|
|
28
|
+
"README.md"
|
|
26
29
|
],
|
|
30
|
+
"sideEffects": false,
|
|
27
31
|
"keywords": [
|
|
28
32
|
"tts",
|
|
29
33
|
"text-to-speech",
|
|
@@ -39,13 +43,13 @@
|
|
|
39
43
|
"url": "https://github.com/Jellypod-Inc/speech-sdk"
|
|
40
44
|
},
|
|
41
45
|
"dependencies": {
|
|
42
|
-
"@
|
|
46
|
+
"@mediabunny/mp3-encoder": "^1.42.0",
|
|
43
47
|
"mediabunny": "^1.40.1",
|
|
44
48
|
"p-retry": "^8.0.0",
|
|
45
49
|
"zod": "^4.3.6"
|
|
46
50
|
},
|
|
47
51
|
"devDependencies": {
|
|
48
|
-
"@biomejs/biome": "2.4.
|
|
52
|
+
"@biomejs/biome": "2.4.14",
|
|
49
53
|
"@types/node": "^25.5.0",
|
|
50
54
|
"dotenv": "^17.3.1",
|
|
51
55
|
"typescript": "^5.8.0",
|
package/NOTICE
DELETED
|
@@ -1,27 +0,0 @@
|
|
|
1
|
-
@speech-sdk/core
|
|
2
|
-
Copyright (c) Jellypod, Inc.
|
|
3
|
-
|
|
4
|
-
This product is licensed under the Apache License, Version 2.0 (see LICENSE).
|
|
5
|
-
|
|
6
|
-
It uses the following third-party software with separate license terms:
|
|
7
|
-
|
|
8
|
-
================================================================================
|
|
9
|
-
@breezystack/lamejs (LGPL-3.0-or-later)
|
|
10
|
-
================================================================================
|
|
11
|
-
|
|
12
|
-
MP3 encoding for `output: { format: "mp3" }` is performed by `@breezystack/lamejs`,
|
|
13
|
-
a JavaScript port of the LAME MP3 encoder.
|
|
14
|
-
|
|
15
|
-
- Package: https://www.npmjs.com/package/@breezystack/lamejs
|
|
16
|
-
- LAME: https://lame.sourceforge.net/
|
|
17
|
-
- License: GNU Lesser General Public License v3.0 or later
|
|
18
|
-
https://www.gnu.org/licenses/lgpl-3.0.html
|
|
19
|
-
|
|
20
|
-
`@speech-sdk/core` does not bundle, statically link, or modify lamejs. It is
|
|
21
|
-
declared as a regular npm dependency and loaded at runtime via dynamic
|
|
22
|
-
`import()` only when the caller requests MP3 output. End users receive lamejs
|
|
23
|
-
as a separate package in their `node_modules` tree and can substitute or
|
|
24
|
-
upgrade it via standard npm overrides.
|
|
25
|
-
|
|
26
|
-
If you modify the lamejs source you must release those modifications under the
|
|
27
|
-
LGPL, per the upstream license terms.
|