voice-router-dev 0.2.7 → 0.2.8
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.d.mts +1 -1
- package/dist/index.d.ts +1 -1
- package/dist/index.js +72 -72
- package/dist/index.js.map +1 -1
- package/dist/index.mjs +72 -72
- package/dist/index.mjs.map +1 -1
- package/package.json +1 -1
package/dist/index.mjs
CHANGED
|
@@ -1983,7 +1983,7 @@ var GladiaAdapter = class extends BaseAdapter {
|
|
|
1983
1983
|
}))
|
|
1984
1984
|
);
|
|
1985
1985
|
return extractWords(allWords, (item) => ({
|
|
1986
|
-
|
|
1986
|
+
word: item.word.word,
|
|
1987
1987
|
start: item.word.start,
|
|
1988
1988
|
end: item.word.end,
|
|
1989
1989
|
confidence: item.word.confidence,
|
|
@@ -2003,11 +2003,11 @@ var GladiaAdapter = class extends BaseAdapter {
|
|
|
2003
2003
|
end: utterance.end,
|
|
2004
2004
|
speaker: utterance.speaker?.toString(),
|
|
2005
2005
|
confidence: utterance.confidence,
|
|
2006
|
-
words: utterance.words.map((
|
|
2007
|
-
|
|
2008
|
-
start:
|
|
2009
|
-
end:
|
|
2010
|
-
confidence:
|
|
2006
|
+
words: utterance.words.map((w) => ({
|
|
2007
|
+
word: w.word,
|
|
2008
|
+
start: w.start,
|
|
2009
|
+
end: w.end,
|
|
2010
|
+
confidence: w.confidence
|
|
2011
2011
|
}))
|
|
2012
2012
|
}));
|
|
2013
2013
|
}
|
|
@@ -2139,11 +2139,11 @@ var GladiaAdapter = class extends BaseAdapter {
|
|
|
2139
2139
|
text: utterance.text,
|
|
2140
2140
|
isFinal: messageData.is_final,
|
|
2141
2141
|
confidence: utterance.confidence,
|
|
2142
|
-
words: utterance.words.map((
|
|
2143
|
-
|
|
2144
|
-
start:
|
|
2145
|
-
end:
|
|
2146
|
-
confidence:
|
|
2142
|
+
words: utterance.words.map((w) => ({
|
|
2143
|
+
word: w.word,
|
|
2144
|
+
start: w.start,
|
|
2145
|
+
end: w.end,
|
|
2146
|
+
confidence: w.confidence
|
|
2147
2147
|
})),
|
|
2148
2148
|
data: message
|
|
2149
2149
|
});
|
|
@@ -2157,11 +2157,11 @@ var GladiaAdapter = class extends BaseAdapter {
|
|
|
2157
2157
|
end: utterance.end,
|
|
2158
2158
|
speaker: utterance.speaker?.toString(),
|
|
2159
2159
|
confidence: utterance.confidence,
|
|
2160
|
-
words: utterance.words.map((
|
|
2161
|
-
|
|
2162
|
-
start:
|
|
2163
|
-
end:
|
|
2164
|
-
confidence:
|
|
2160
|
+
words: utterance.words.map((w) => ({
|
|
2161
|
+
word: w.word,
|
|
2162
|
+
start: w.start,
|
|
2163
|
+
end: w.end,
|
|
2164
|
+
confidence: w.confidence
|
|
2165
2165
|
}))
|
|
2166
2166
|
};
|
|
2167
2167
|
callbacks?.onUtterance?.(utteranceData);
|
|
@@ -2866,14 +2866,14 @@ var AssemblyAIAdapter = class extends BaseAdapter {
|
|
|
2866
2866
|
if (!transcript.words || transcript.words.length === 0) {
|
|
2867
2867
|
return void 0;
|
|
2868
2868
|
}
|
|
2869
|
-
return transcript.words.map((
|
|
2870
|
-
|
|
2871
|
-
start:
|
|
2869
|
+
return transcript.words.map((w) => ({
|
|
2870
|
+
word: w.text,
|
|
2871
|
+
start: w.start / 1e3,
|
|
2872
2872
|
// Convert ms to seconds
|
|
2873
|
-
end:
|
|
2873
|
+
end: w.end / 1e3,
|
|
2874
2874
|
// Convert ms to seconds
|
|
2875
|
-
confidence:
|
|
2876
|
-
speaker:
|
|
2875
|
+
confidence: w.confidence,
|
|
2876
|
+
speaker: w.speaker || void 0
|
|
2877
2877
|
}));
|
|
2878
2878
|
}
|
|
2879
2879
|
/**
|
|
@@ -2891,11 +2891,11 @@ var AssemblyAIAdapter = class extends BaseAdapter {
|
|
|
2891
2891
|
// Convert ms to seconds
|
|
2892
2892
|
speaker: utterance.speaker || void 0,
|
|
2893
2893
|
confidence: utterance.confidence,
|
|
2894
|
-
words: utterance.words.map((
|
|
2895
|
-
|
|
2896
|
-
start:
|
|
2897
|
-
end:
|
|
2898
|
-
confidence:
|
|
2894
|
+
words: utterance.words.map((w) => ({
|
|
2895
|
+
word: w.text,
|
|
2896
|
+
start: w.start / 1e3,
|
|
2897
|
+
end: w.end / 1e3,
|
|
2898
|
+
confidence: w.confidence
|
|
2899
2899
|
}))
|
|
2900
2900
|
}));
|
|
2901
2901
|
}
|
|
@@ -2988,12 +2988,12 @@ var AssemblyAIAdapter = class extends BaseAdapter {
|
|
|
2988
2988
|
text: turnMsg.transcript,
|
|
2989
2989
|
isFinal: turnMsg.end_of_turn,
|
|
2990
2990
|
confidence: turnMsg.end_of_turn_confidence,
|
|
2991
|
-
words: turnMsg.words.map((
|
|
2992
|
-
|
|
2993
|
-
start:
|
|
2991
|
+
words: turnMsg.words.map((w) => ({
|
|
2992
|
+
word: w.text,
|
|
2993
|
+
start: w.start / 1e3,
|
|
2994
2994
|
// Convert ms to seconds
|
|
2995
|
-
end:
|
|
2996
|
-
confidence:
|
|
2995
|
+
end: w.end / 1e3,
|
|
2996
|
+
confidence: w.confidence
|
|
2997
2997
|
})),
|
|
2998
2998
|
data: turnMsg
|
|
2999
2999
|
});
|
|
@@ -3352,11 +3352,11 @@ var DeepgramAdapter = class extends BaseAdapter {
|
|
|
3352
3352
|
return void 0;
|
|
3353
3353
|
}
|
|
3354
3354
|
return alternative.words.map(
|
|
3355
|
-
(
|
|
3356
|
-
|
|
3357
|
-
start:
|
|
3358
|
-
end:
|
|
3359
|
-
confidence:
|
|
3355
|
+
(w) => ({
|
|
3356
|
+
word: w.word || "",
|
|
3357
|
+
start: w.start || 0,
|
|
3358
|
+
end: w.end || 0,
|
|
3359
|
+
confidence: w.confidence,
|
|
3360
3360
|
speaker: void 0
|
|
3361
3361
|
// Speaker info is at utterance level, not word level
|
|
3362
3362
|
})
|
|
@@ -3376,11 +3376,11 @@ var DeepgramAdapter = class extends BaseAdapter {
|
|
|
3376
3376
|
end: utterance.end || 0,
|
|
3377
3377
|
speaker: utterance.speaker?.toString(),
|
|
3378
3378
|
confidence: utterance.confidence,
|
|
3379
|
-
words: utterance.words?.map((
|
|
3380
|
-
|
|
3381
|
-
start:
|
|
3382
|
-
end:
|
|
3383
|
-
confidence:
|
|
3379
|
+
words: utterance.words?.map((w) => ({
|
|
3380
|
+
word: w.word || "",
|
|
3381
|
+
start: w.start || 0,
|
|
3382
|
+
end: w.end || 0,
|
|
3383
|
+
confidence: w.confidence
|
|
3384
3384
|
}))
|
|
3385
3385
|
}));
|
|
3386
3386
|
}
|
|
@@ -3471,11 +3471,11 @@ var DeepgramAdapter = class extends BaseAdapter {
|
|
|
3471
3471
|
if (channel) {
|
|
3472
3472
|
const transcript = channel.transcript;
|
|
3473
3473
|
const isFinal = message.is_final;
|
|
3474
|
-
const words = channel.words?.map((
|
|
3475
|
-
|
|
3476
|
-
start:
|
|
3477
|
-
end:
|
|
3478
|
-
confidence:
|
|
3474
|
+
const words = channel.words?.map((w) => ({
|
|
3475
|
+
word: w.word,
|
|
3476
|
+
start: w.start,
|
|
3477
|
+
end: w.end,
|
|
3478
|
+
confidence: w.confidence
|
|
3479
3479
|
}));
|
|
3480
3480
|
callbacks?.onTranscript?.({
|
|
3481
3481
|
type: "transcript",
|
|
@@ -3816,12 +3816,12 @@ var AzureSTTAdapter = class extends BaseAdapter {
|
|
|
3816
3816
|
const recognizedPhrases = transcriptionData.recognizedPhrases || [];
|
|
3817
3817
|
const fullText = combinedPhrases.map((phrase) => phrase.display || phrase.lexical).join(" ") || "";
|
|
3818
3818
|
const words = recognizedPhrases.flatMap(
|
|
3819
|
-
(phrase) => (phrase.nBest?.[0]?.words || []).map((
|
|
3820
|
-
|
|
3821
|
-
start:
|
|
3819
|
+
(phrase) => (phrase.nBest?.[0]?.words || []).map((w) => ({
|
|
3820
|
+
word: w.word,
|
|
3821
|
+
start: w.offsetInTicks / 1e7,
|
|
3822
3822
|
// Convert ticks to seconds
|
|
3823
|
-
end: (
|
|
3824
|
-
confidence:
|
|
3823
|
+
end: (w.offsetInTicks + w.durationInTicks) / 1e7,
|
|
3824
|
+
confidence: w.confidence,
|
|
3825
3825
|
speaker: phrase.speaker !== void 0 ? phrase.speaker.toString() : void 0
|
|
3826
3826
|
}))
|
|
3827
3827
|
);
|
|
@@ -4102,10 +4102,10 @@ var OpenAIWhisperAdapter = class extends BaseAdapter {
|
|
|
4102
4102
|
}
|
|
4103
4103
|
if ("duration" in response && "language" in response) {
|
|
4104
4104
|
const verboseResponse = response;
|
|
4105
|
-
const words = verboseResponse.words?.map((
|
|
4106
|
-
|
|
4107
|
-
start:
|
|
4108
|
-
end:
|
|
4105
|
+
const words = verboseResponse.words?.map((w) => ({
|
|
4106
|
+
word: w.word,
|
|
4107
|
+
start: w.start,
|
|
4108
|
+
end: w.end,
|
|
4109
4109
|
confidence: void 0
|
|
4110
4110
|
}));
|
|
4111
4111
|
const requestId2 = `openai-${Date.now()}`;
|
|
@@ -4371,7 +4371,7 @@ var SpeechmaticsAdapter = class extends BaseAdapter {
|
|
|
4371
4371
|
normalizeResponse(response) {
|
|
4372
4372
|
const text = response.results.filter((r) => r.type === "word" && r.alternatives).map((r) => r.alternatives[0]?.content || "").join(" ");
|
|
4373
4373
|
const words = response.results.filter((r) => r.type === "word" && r.start_time !== void 0 && r.end_time !== void 0).map((result) => ({
|
|
4374
|
-
|
|
4374
|
+
word: result.alternatives?.[0]?.content || "",
|
|
4375
4375
|
start: result.start_time,
|
|
4376
4376
|
end: result.end_time,
|
|
4377
4377
|
confidence: result.alternatives?.[0]?.confidence,
|
|
@@ -4522,12 +4522,12 @@ var GladiaWebhookHandler = class extends BaseWebhookHandler {
|
|
|
4522
4522
|
/**
|
|
4523
4523
|
* Convert Gladia WordDTO to unified Word type
|
|
4524
4524
|
*/
|
|
4525
|
-
mapWord(
|
|
4525
|
+
mapWord(w) {
|
|
4526
4526
|
return {
|
|
4527
|
-
|
|
4528
|
-
start:
|
|
4529
|
-
end:
|
|
4530
|
-
confidence:
|
|
4527
|
+
word: w.word,
|
|
4528
|
+
start: w.start,
|
|
4529
|
+
end: w.end,
|
|
4530
|
+
confidence: w.confidence
|
|
4531
4531
|
};
|
|
4532
4532
|
}
|
|
4533
4533
|
/**
|
|
@@ -4865,11 +4865,11 @@ var DeepgramWebhookHandler = class extends BaseWebhookHandler {
|
|
|
4865
4865
|
raw: payload
|
|
4866
4866
|
};
|
|
4867
4867
|
}
|
|
4868
|
-
const words = alternative.words && alternative.words.length > 0 ? alternative.words.map((
|
|
4869
|
-
|
|
4870
|
-
start:
|
|
4871
|
-
end:
|
|
4872
|
-
confidence:
|
|
4868
|
+
const words = alternative.words && alternative.words.length > 0 ? alternative.words.map((w) => ({
|
|
4869
|
+
word: w.word || "",
|
|
4870
|
+
start: w.start || 0,
|
|
4871
|
+
end: w.end || 0,
|
|
4872
|
+
confidence: w.confidence
|
|
4873
4873
|
})) : void 0;
|
|
4874
4874
|
const speakers = response.results.utterances && response.results.utterances.length > 0 ? response.results.utterances.map((utterance) => ({
|
|
4875
4875
|
id: utterance.speaker?.toString() || "unknown",
|
|
@@ -4883,11 +4883,11 @@ var DeepgramWebhookHandler = class extends BaseWebhookHandler {
|
|
|
4883
4883
|
end: utterance.end || 0,
|
|
4884
4884
|
speaker: utterance.speaker?.toString(),
|
|
4885
4885
|
confidence: utterance.confidence,
|
|
4886
|
-
words: utterance.words && utterance.words.length > 0 ? utterance.words.map((
|
|
4887
|
-
|
|
4888
|
-
start:
|
|
4889
|
-
end:
|
|
4890
|
-
confidence:
|
|
4886
|
+
words: utterance.words && utterance.words.length > 0 ? utterance.words.map((w) => ({
|
|
4887
|
+
word: w.word || "",
|
|
4888
|
+
start: w.start || 0,
|
|
4889
|
+
end: w.end || 0,
|
|
4890
|
+
confidence: w.confidence
|
|
4891
4891
|
})) : void 0
|
|
4892
4892
|
})) : void 0;
|
|
4893
4893
|
const summary = alternative.summaries?.[0]?.summary;
|