@speech-sdk/core 0.0.3 → 0.0.4
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +37 -0
- package/dist/audio-tags.d.ts +6 -0
- package/dist/audio-tags.d.ts.map +1 -0
- package/dist/audio-tags.js +17 -0
- package/dist/audio-tags.js.map +1 -0
- package/dist/errors.d.ts +1 -1
- package/dist/errors.d.ts.map +1 -1
- package/dist/errors.js +5 -5
- package/dist/errors.js.map +1 -1
- package/dist/generate-speech.d.ts +2 -2
- package/dist/generate-speech.d.ts.map +1 -1
- package/dist/generate-speech.js +29 -6
- package/dist/generate-speech.js.map +1 -1
- package/dist/index.d.ts +6 -5
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +4 -2
- package/dist/index.js.map +1 -1
- package/dist/provider-utils.d.ts.map +1 -1
- package/dist/provider-utils.js +16 -12
- package/dist/provider-utils.js.map +1 -1
- package/dist/providers/cartesia/index.d.ts +8 -1
- package/dist/providers/cartesia/index.d.ts.map +1 -1
- package/dist/providers/cartesia/index.js +160 -15
- package/dist/providers/cartesia/index.js.map +1 -1
- package/dist/providers/deepgram/index.d.ts +1 -1
- package/dist/providers/deepgram/index.d.ts.map +1 -1
- package/dist/providers/deepgram/index.js +16 -9
- package/dist/providers/deepgram/index.js.map +1 -1
- package/dist/providers/elevenlabs/index.d.ts +6 -1
- package/dist/providers/elevenlabs/index.d.ts.map +1 -1
- package/dist/providers/elevenlabs/index.js +167 -33
- package/dist/providers/elevenlabs/index.js.map +1 -1
- package/dist/providers/fal/index.d.ts +1 -1
- package/dist/providers/fal/index.d.ts.map +1 -1
- package/dist/providers/fal/index.js +52 -17
- package/dist/providers/fal/index.js.map +1 -1
- package/dist/providers/fish-audio/index.d.ts +1 -1
- package/dist/providers/fish-audio/index.d.ts.map +1 -1
- package/dist/providers/fish-audio/index.js +17 -10
- package/dist/providers/fish-audio/index.js.map +1 -1
- package/dist/providers/google/index.d.ts +1 -1
- package/dist/providers/google/index.d.ts.map +1 -1
- package/dist/providers/google/index.js +80 -15
- package/dist/providers/google/index.js.map +1 -1
- package/dist/providers/hume/index.d.ts +1 -1
- package/dist/providers/hume/index.d.ts.map +1 -1
- package/dist/providers/hume/index.js +43 -15
- package/dist/providers/hume/index.js.map +1 -1
- package/dist/providers/mistral/index.d.ts +1 -1
- package/dist/providers/mistral/index.d.ts.map +1 -1
- package/dist/providers/mistral/index.js +33 -16
- package/dist/providers/mistral/index.js.map +1 -1
- package/dist/providers/murf/index.d.ts +1 -1
- package/dist/providers/murf/index.d.ts.map +1 -1
- package/dist/providers/murf/index.js +62 -14
- package/dist/providers/murf/index.js.map +1 -1
- package/dist/providers/openai/index.d.ts +1 -1
- package/dist/providers/openai/index.d.ts.map +1 -1
- package/dist/providers/openai/index.js +99 -18
- package/dist/providers/openai/index.js.map +1 -1
- package/dist/providers/resemble/index.d.ts +1 -1
- package/dist/providers/resemble/index.d.ts.map +1 -1
- package/dist/providers/resemble/index.js +41 -10
- package/dist/providers/resemble/index.js.map +1 -1
- package/dist/providers/unreal-speech/index.d.ts +1 -1
- package/dist/providers/unreal-speech/index.d.ts.map +1 -1
- package/dist/providers/unreal-speech/index.js +20 -13
- package/dist/providers/unreal-speech/index.js.map +1 -1
- package/dist/resolve-provider.d.ts +1 -1
- package/dist/resolve-provider.d.ts.map +1 -1
- package/dist/resolve-provider.js +34 -34
- package/dist/resolve-provider.js.map +1 -1
- package/dist/speech-provider.d.ts +9 -5
- package/dist/speech-provider.d.ts.map +1 -1
- package/dist/speech-result.d.ts +4 -3
- package/dist/speech-result.d.ts.map +1 -1
- package/dist/speech-result.js +9 -7
- package/dist/speech-result.js.map +1 -1
- package/dist/types.d.ts +7 -7
- package/dist/types.d.ts.map +1 -1
- package/package.json +6 -2
|
@@ -1,27 +1,108 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { handleErrorResponse, resolveApiKey } from "../../provider-utils.js";
|
|
2
2
|
export class OpenAISpeechProvider {
|
|
3
|
-
id =
|
|
4
|
-
defaultModel =
|
|
3
|
+
id = "openai";
|
|
4
|
+
defaultModel = "gpt-4o-mini-tts";
|
|
5
5
|
static LANGUAGES = [
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
6
|
+
"af",
|
|
7
|
+
"ar",
|
|
8
|
+
"bg",
|
|
9
|
+
"bn",
|
|
10
|
+
"bs",
|
|
11
|
+
"ca",
|
|
12
|
+
"cs",
|
|
13
|
+
"cy",
|
|
14
|
+
"da",
|
|
15
|
+
"de",
|
|
16
|
+
"el",
|
|
17
|
+
"en",
|
|
18
|
+
"es",
|
|
19
|
+
"et",
|
|
20
|
+
"fi",
|
|
21
|
+
"fr",
|
|
22
|
+
"gl",
|
|
23
|
+
"gu",
|
|
24
|
+
"he",
|
|
25
|
+
"hi",
|
|
26
|
+
"hr",
|
|
27
|
+
"hu",
|
|
28
|
+
"id",
|
|
29
|
+
"is",
|
|
30
|
+
"it",
|
|
31
|
+
"ja",
|
|
32
|
+
"jv",
|
|
33
|
+
"ka",
|
|
34
|
+
"kk",
|
|
35
|
+
"km",
|
|
36
|
+
"kn",
|
|
37
|
+
"ko",
|
|
38
|
+
"lo",
|
|
39
|
+
"lt",
|
|
40
|
+
"lv",
|
|
41
|
+
"mk",
|
|
42
|
+
"ml",
|
|
43
|
+
"mn",
|
|
44
|
+
"mr",
|
|
45
|
+
"ms",
|
|
46
|
+
"my",
|
|
47
|
+
"ne",
|
|
48
|
+
"nl",
|
|
49
|
+
"no",
|
|
50
|
+
"pa",
|
|
51
|
+
"pl",
|
|
52
|
+
"pt",
|
|
53
|
+
"ro",
|
|
54
|
+
"ru",
|
|
55
|
+
"si",
|
|
56
|
+
"sk",
|
|
57
|
+
"sl",
|
|
58
|
+
"so",
|
|
59
|
+
"sq",
|
|
60
|
+
"sr",
|
|
61
|
+
"su",
|
|
62
|
+
"sv",
|
|
63
|
+
"sw",
|
|
64
|
+
"ta",
|
|
65
|
+
"te",
|
|
66
|
+
"th",
|
|
67
|
+
"tl",
|
|
68
|
+
"tr",
|
|
69
|
+
"uk",
|
|
70
|
+
"ur",
|
|
71
|
+
"vi",
|
|
72
|
+
"zh",
|
|
13
73
|
];
|
|
14
74
|
models = [
|
|
15
|
-
{
|
|
16
|
-
|
|
17
|
-
|
|
75
|
+
{
|
|
76
|
+
id: "gpt-4o-mini-tts",
|
|
77
|
+
languages: OpenAISpeechProvider.LANGUAGES,
|
|
78
|
+
releaseDate: "2025-03-20",
|
|
79
|
+
openSource: false,
|
|
80
|
+
inlineVoiceCloning: false,
|
|
81
|
+
zeroDataRetention: true,
|
|
82
|
+
},
|
|
83
|
+
{
|
|
84
|
+
id: "tts-1",
|
|
85
|
+
languages: OpenAISpeechProvider.LANGUAGES,
|
|
86
|
+
releaseDate: "2023-11-06",
|
|
87
|
+
openSource: false,
|
|
88
|
+
inlineVoiceCloning: false,
|
|
89
|
+
zeroDataRetention: true,
|
|
90
|
+
},
|
|
91
|
+
{
|
|
92
|
+
id: "tts-1-hd",
|
|
93
|
+
languages: OpenAISpeechProvider.LANGUAGES,
|
|
94
|
+
releaseDate: "2023-11-06",
|
|
95
|
+
openSource: false,
|
|
96
|
+
inlineVoiceCloning: false,
|
|
97
|
+
zeroDataRetention: true,
|
|
98
|
+
},
|
|
18
99
|
];
|
|
19
100
|
apiKey;
|
|
20
101
|
baseURL;
|
|
21
102
|
fetchFn;
|
|
22
103
|
constructor(config) {
|
|
23
104
|
this.apiKey = config.apiKey;
|
|
24
|
-
this.baseURL = config.baseURL ??
|
|
105
|
+
this.baseURL = config.baseURL ?? "https://api.openai.com/v1";
|
|
25
106
|
this.fetchFn = config.fetch ?? globalThis.fetch;
|
|
26
107
|
}
|
|
27
108
|
async generate(options) {
|
|
@@ -33,10 +114,10 @@ export class OpenAISpeechProvider {
|
|
|
33
114
|
};
|
|
34
115
|
const url = `${this.baseURL}/audio/speech`;
|
|
35
116
|
const response = await this.fetchFn(url, {
|
|
36
|
-
method:
|
|
117
|
+
method: "POST",
|
|
37
118
|
headers: {
|
|
38
|
-
|
|
39
|
-
|
|
119
|
+
"Content-Type": "application/json",
|
|
120
|
+
Authorization: `Bearer ${resolveApiKey(this.apiKey, "OPENAI_API_KEY", "OpenAI")}`,
|
|
40
121
|
...options.headers,
|
|
41
122
|
},
|
|
42
123
|
body: JSON.stringify(body),
|
|
@@ -44,7 +125,7 @@ export class OpenAISpeechProvider {
|
|
|
44
125
|
});
|
|
45
126
|
await handleErrorResponse(response, `openai/${options.modelId}`);
|
|
46
127
|
const arrayBuffer = await response.arrayBuffer();
|
|
47
|
-
const mediaType = response.headers.get(
|
|
128
|
+
const mediaType = response.headers.get("content-type") ?? "audio/mpeg";
|
|
48
129
|
return {
|
|
49
130
|
audio: new Uint8Array(arrayBuffer),
|
|
50
131
|
mediaType,
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/openai/index.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/openai/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,mBAAmB,EAAE,aAAa,EAAE,MAAM,yBAAyB,CAAC;AAS7E,MAAM,OAAO,oBAAoB;IACtB,EAAE,GAAG,QAAQ,CAAC;IACd,YAAY,GAAG,iBAAiB,CAAC;IAElC,MAAM,CAAU,SAAS,GAAG;QAClC,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;QACJ,IAAI;KACI,CAAC;IAEF,MAAM,GAAG;QAChB;YACE,EAAE,EAAE,iBAAiB;YACrB,SAAS,EAAE,oBAAoB,CAAC,SAAS;YACzC,WAAW,EAAE,YAAY;YACzB,UAAU,EAAE,KAAK;YACjB,kBAAkB,EAAE,KAAK;YACzB,iBAAiB,EAAE,IAAI;SACxB;QACD;YACE,EAAE,EAAE,OAAO;YACX,SAAS,EAAE,oBAAoB,CAAC,SAAS;YACzC,WAAW,EAAE,YAAY;YACzB,UAAU,EAAE,KAAK;YACjB,kBAAkB,EAAE,KAAK;YACzB,iBAAiB,EAAE,IAAI;SACxB;QACD;YACE,EAAE,EAAE,UAAU;YACd,SAAS,EAAE,oBAAoB,CAAC,SAAS;YACzC,WAAW,EAAE,YAAY;YACzB,UAAU,EAAE,KAAK;YACjB,kBAAkB,EAAE,KAAK;YACzB,iBAAiB,EAAE,IAAI;SACxB;KACO,CAAC;IAEM,MAAM,CAAqB;IAC3B,OAAO,CAAS;IAChB,OAAO,CAA0B;IAElD,YAAY,MAAkC;QAC5C,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,OAAO,IAAI,2BAA2B,CAAC;QAC7D,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,KAAK,IAAI,UAAU,CAAC,KAAK,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,OAOd;QAKC,MAAM,IAAI,GAA4B;YACpC,GAAG,OAAO,CAAC,eAAe;YAC1B,KAAK,EAAE,OAAO,CAAC,OAAO;YACtB,KAAK,EAAE,OAAO,CAAC,IAAI;YACnB,KAAK,EAAE,OAAO,CAAC,KAAK;SACrB,CAAC;QAEF,MAAM,GAAG,GAAG,GAAG,IAAI,CAAC,OAAO,eAAe,CAAC;QAE3C,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,GAAG,EAAE;YACvC,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,cAAc,EAAE,kBAAkB;gBAClC,aAAa,EAAE,UAAU,aAAa,CAAC,IAAI,CAAC,MAAM,EAAE,gBAAgB,EAAE,QAAQ,CAAC,EAAE;gBACjF,GAAG,OAAO,CAAC,OAAO;aACnB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC;YAC1B,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,MAAM,mBAAmB,CAAC,QAAQ,EAAE,UAAU,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;QAEjE,MAAM,WAAW,GAAG,MAAM,QAAQ,CAAC,WAAW,EAAE,CAAC;QACjD,MAAM,SAAS,GAAG,QAAQ,CAAC,OAAO,CAAC,GAAG,CAAC,cAAc,CAAC,IAAI,YAAY,CAAC;QAEvE,OAAO;YACL,KAAK,EAAE,IAAI,UAAU,CAAC,WAAW,CAAC;YAClC,SAAS;SACV,CAAC;IACJ,CAAC;;AAGH,MAAM,UAAU,YAAY,CAAC,SAAqC,EAAE;IAClE,MAAM,QAAQ,GAAG,IAAI,oBAAoB,CAAC,MAAM,CAAC,CAAC;IAElD,OAAO,SAAS,MAAM,CAAC,OAAgB;QACrC,OAAO;YACL,QAAQ;YACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;SAC1C,CAAC;IACJ,CAAC,CAAC;AACJ,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"AACA,OAAO,KAAK,EAAE,aAAa,EAAE,cAAc,EAAE,MAAM,0BAA0B,CAAC;AAE9E,MAAM,WAAW,4BAA4B;IAC3C,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,OAAO,UAAU,CAAC,KAAK,CAAC;CACjC;AAED,qBAAa,sBAAuB,YAAW,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC;IAC3E,QAAQ,CAAC,EAAE,cAAc;IACzB,QAAQ,CAAC,YAAY,aAAa;IAElC,QAAQ,CAAC,MAAM;;;;;;;OAiCJ;IAEX,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAqB;IAC5C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;IACjC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAA0B;gBAEtC,MAAM,EAAE,4BAA4B;IAM1C,QAAQ,CAAC,OAAO,EAAE;QACtB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,MAAM,CAAC;QACd,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC;CAiCH;AAED,wBAAgB,cAAc,CAAC,MAAM,GAAE,4BAAiC,IAG7C,UAAU,MAAM,KAAG,aAAa,CAAC,MAAM,CAAC,CAMlE"}
|
|
@@ -1,16 +1,47 @@
|
|
|
1
|
-
import {
|
|
1
|
+
import { handleErrorResponse, resolveApiKey } from "../../provider-utils.js";
|
|
2
2
|
export class ResembleSpeechProvider {
|
|
3
|
-
id =
|
|
4
|
-
defaultModel =
|
|
3
|
+
id = "resemble";
|
|
4
|
+
defaultModel = "default";
|
|
5
5
|
models = [
|
|
6
|
-
{
|
|
6
|
+
{
|
|
7
|
+
id: "default",
|
|
8
|
+
languages: [
|
|
9
|
+
"en",
|
|
10
|
+
"ar",
|
|
11
|
+
"da",
|
|
12
|
+
"de",
|
|
13
|
+
"el",
|
|
14
|
+
"es",
|
|
15
|
+
"fi",
|
|
16
|
+
"fr",
|
|
17
|
+
"he",
|
|
18
|
+
"hi",
|
|
19
|
+
"it",
|
|
20
|
+
"ja",
|
|
21
|
+
"ko",
|
|
22
|
+
"ms",
|
|
23
|
+
"nl",
|
|
24
|
+
"no",
|
|
25
|
+
"pl",
|
|
26
|
+
"pt",
|
|
27
|
+
"ru",
|
|
28
|
+
"sv",
|
|
29
|
+
"sw",
|
|
30
|
+
"tr",
|
|
31
|
+
"zh",
|
|
32
|
+
],
|
|
33
|
+
releaseDate: "2025-09-04",
|
|
34
|
+
openSource: true,
|
|
35
|
+
inlineVoiceCloning: true,
|
|
36
|
+
zeroDataRetention: false,
|
|
37
|
+
},
|
|
7
38
|
];
|
|
8
39
|
apiKey;
|
|
9
40
|
baseURL;
|
|
10
41
|
fetchFn;
|
|
11
42
|
constructor(config) {
|
|
12
43
|
this.apiKey = config.apiKey;
|
|
13
|
-
this.baseURL = config.baseURL ??
|
|
44
|
+
this.baseURL = config.baseURL ?? "https://f.cluster.resemble.ai";
|
|
14
45
|
this.fetchFn = config.fetch ?? globalThis.fetch;
|
|
15
46
|
}
|
|
16
47
|
async generate(options) {
|
|
@@ -21,20 +52,20 @@ export class ResembleSpeechProvider {
|
|
|
21
52
|
data: options.text,
|
|
22
53
|
};
|
|
23
54
|
const response = await this.fetchFn(url, {
|
|
24
|
-
method:
|
|
55
|
+
method: "POST",
|
|
25
56
|
headers: {
|
|
26
|
-
|
|
27
|
-
|
|
57
|
+
"Content-Type": "application/json",
|
|
58
|
+
Authorization: resolveApiKey(this.apiKey, "RESEMBLE_API_KEY", "Resemble"),
|
|
28
59
|
...options.headers,
|
|
29
60
|
},
|
|
30
61
|
body: JSON.stringify(body),
|
|
31
62
|
signal: options.abortSignal,
|
|
32
63
|
});
|
|
33
64
|
await handleErrorResponse(response, `resemble/${options.modelId}`);
|
|
34
|
-
const json = await response.json();
|
|
65
|
+
const json = (await response.json());
|
|
35
66
|
return {
|
|
36
67
|
audio: json.audio_content,
|
|
37
|
-
mediaType:
|
|
68
|
+
mediaType: "audio/wav",
|
|
38
69
|
};
|
|
39
70
|
}
|
|
40
71
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,mBAAmB,EAAE,aAAa,EAAE,MAAM,yBAAyB,CAAC;AAS7E,MAAM,OAAO,sBAAsB;IACxB,EAAE,GAAG,UAAU,CAAC;IAChB,YAAY,GAAG,SAAS,CAAC;IAEzB,MAAM,GAAG;QAChB;YACE,EAAE,EAAE,SAAS;YACb,SAAS,EAAE;gBACT,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;gBACJ,IAAI;aACL;YACD,WAAW,EAAE,YAAY;YACzB,UAAU,EAAE,IAAI;YAChB,kBAAkB,EAAE,IAAI;YACxB,iBAAiB,EAAE,KAAK;SACzB;KACO,CAAC;IAEM,MAAM,CAAqB;IAC3B,OAAO,CAAS;IAChB,OAAO,CAA0B;IAElD,YAAY,MAAoC;QAC9C,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,OAAO,IAAI,+BAA+B,CAAC;QACjE,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,KAAK,IAAI,UAAU,CAAC,KAAK,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,OAOd;QAKC,MAAM,GAAG,GAAG,GAAG,IAAI,CAAC,OAAO,aAAa,CAAC;QAEzC,MAAM,IAAI,GAA4B;YACpC,GAAG,OAAO,CAAC,eAAe;YAC1B,UAAU,EAAE,OAAO,CAAC,KAAK;YACzB,IAAI,EAAE,OAAO,CAAC,IAAI;SACnB,CAAC;QAEF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,GAAG,EAAE;YACvC,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,cAAc,EAAE,kBAAkB;gBAClC,aAAa,EAAE,aAAa,CAC1B,IAAI,CAAC,MAAM,EACX,kBAAkB,EAClB,UAAU,CACX;gBACD,GAAG,OAAO,CAAC,OAAO;aACnB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC;YAC1B,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,MAAM,mBAAmB,CAAC,QAAQ,EAAE,YAAY,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;QAEnE,MAAM,IAAI,GAAG,CAAC,MAAM,QAAQ,CAAC,IAAI,EAAE,CAA8B,CAAC;QAElE,OAAO;YACL,KAAK,EAAE,IAAI,CAAC,aAAa;YACzB,SAAS,EAAE,WAAW;SACvB,CAAC;IACJ,CAAC;CACF;AAED,MAAM,UAAU,cAAc,CAAC,SAAuC,EAAE;IACtE,MAAM,QAAQ,GAAG,IAAI,sBAAsB,CAAC,MAAM,CAAC,CAAC;IAEpD,OAAO,SAAS,QAAQ,CAAC,OAAgB;QACvC,OAAO;YACL,QAAQ;YACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;SAC1C,CAAC;IACJ,CAAC,CAAC;AACJ,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"AAEA,OAAO,KAAK,EAAE,aAAa,EAAE,cAAc,EAAE,MAAM,0BAA0B,CAAC;AAE9E,MAAM,WAAW,0BAA0B;IACzC,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,OAAO,UAAU,CAAC,KAAK,CAAC;CACjC;AAED,qBAAa,oBAAqB,YAAW,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC;IACzE,QAAQ,CAAC,EAAE,mBAAmB;IAC9B,QAAQ,CAAC,YAAY,aAAa;IAElC,QAAQ,CAAC,MAAM;;;;;;;OASJ;IAEX,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAqB;IAC5C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;IACjC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAA0B;gBAEtC,MAAM,EAAE,0BAA0B;IAMxC,QAAQ,CAAC,OAAO,EAAE;QACtB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,UAAU,CAAC;QAClB,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC;CA6CH;AAED,wBAAgB,kBAAkB,CAAC,MAAM,GAAE,0BAA+B,IAG3C,UAAU,MAAM,KAAG,aAAa,CAAC,MAAM,CAAC,CAMtE"}
|
|
@@ -1,40 +1,47 @@
|
|
|
1
|
-
import {
|
|
2
|
-
import {
|
|
1
|
+
import { ApiError } from "../../errors.js";
|
|
2
|
+
import { handleErrorResponse, resolveApiKey } from "../../provider-utils.js";
|
|
3
3
|
export class UnrealSpeechProvider {
|
|
4
|
-
id =
|
|
5
|
-
defaultModel =
|
|
4
|
+
id = "unreal-speech";
|
|
5
|
+
defaultModel = "default";
|
|
6
6
|
models = [
|
|
7
|
-
{
|
|
7
|
+
{
|
|
8
|
+
id: "default",
|
|
9
|
+
languages: ["en", "zh", "hi", "es", "pt", "ja", "fr", "it"],
|
|
10
|
+
releaseDate: "2025-06-01",
|
|
11
|
+
openSource: false,
|
|
12
|
+
inlineVoiceCloning: false,
|
|
13
|
+
zeroDataRetention: false,
|
|
14
|
+
},
|
|
8
15
|
];
|
|
9
16
|
apiKey;
|
|
10
17
|
baseURL;
|
|
11
18
|
fetchFn;
|
|
12
19
|
constructor(config) {
|
|
13
20
|
this.apiKey = config.apiKey;
|
|
14
|
-
this.baseURL = config.baseURL ??
|
|
21
|
+
this.baseURL = config.baseURL ?? "https://api.v8.unrealspeech.com";
|
|
15
22
|
this.fetchFn = config.fetch ?? globalThis.fetch;
|
|
16
23
|
}
|
|
17
24
|
async generate(options) {
|
|
18
25
|
const url = `${this.baseURL}/speech`;
|
|
19
26
|
const body = {
|
|
20
27
|
...options.providerOptions,
|
|
21
|
-
AudioFormat:
|
|
22
|
-
OutputFormat:
|
|
28
|
+
AudioFormat: "mp3",
|
|
29
|
+
OutputFormat: "uri",
|
|
23
30
|
VoiceId: options.voice,
|
|
24
31
|
Text: options.text,
|
|
25
32
|
};
|
|
26
33
|
const response = await this.fetchFn(url, {
|
|
27
|
-
method:
|
|
34
|
+
method: "POST",
|
|
28
35
|
headers: {
|
|
29
|
-
|
|
30
|
-
|
|
36
|
+
"Content-Type": "application/json",
|
|
37
|
+
Authorization: `Bearer ${resolveApiKey(this.apiKey, "UNREAL_SPEECH_API_KEY", "Unreal Speech")}`,
|
|
31
38
|
...options.headers,
|
|
32
39
|
},
|
|
33
40
|
body: JSON.stringify(body),
|
|
34
41
|
signal: options.abortSignal,
|
|
35
42
|
});
|
|
36
43
|
await handleErrorResponse(response, `unreal-speech/${options.modelId}`);
|
|
37
|
-
const json = await response.json();
|
|
44
|
+
const json = (await response.json());
|
|
38
45
|
const audioResponse = await this.fetchFn(json.OutputUri, {
|
|
39
46
|
signal: options.abortSignal,
|
|
40
47
|
});
|
|
@@ -48,7 +55,7 @@ export class UnrealSpeechProvider {
|
|
|
48
55
|
const arrayBuffer = await audioResponse.arrayBuffer();
|
|
49
56
|
return {
|
|
50
57
|
audio: new Uint8Array(arrayBuffer),
|
|
51
|
-
mediaType:
|
|
58
|
+
mediaType: "audio/mpeg",
|
|
52
59
|
};
|
|
53
60
|
}
|
|
54
61
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,MAAM,iBAAiB,CAAC;AAC3C,OAAO,EAAE,mBAAmB,EAAE,aAAa,EAAE,MAAM,yBAAyB,CAAC;AAS7E,MAAM,OAAO,oBAAoB;IACtB,EAAE,GAAG,eAAe,CAAC;IACrB,YAAY,GAAG,SAAS,CAAC;IAEzB,MAAM,GAAG;QAChB;YACE,EAAE,EAAE,SAAS;YACb,SAAS,EAAE,CAAC,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,IAAI,EAAE,IAAI,CAAC;YAC3D,WAAW,EAAE,YAAY;YACzB,UAAU,EAAE,KAAK;YACjB,kBAAkB,EAAE,KAAK;YACzB,iBAAiB,EAAE,KAAK;SACzB;KACO,CAAC;IAEM,MAAM,CAAqB;IAC3B,OAAO,CAAS;IAChB,OAAO,CAA0B;IAElD,YAAY,MAAkC;QAC5C,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,OAAO,IAAI,iCAAiC,CAAC;QACnE,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,KAAK,IAAI,UAAU,CAAC,KAAK,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,OAOd;QAKC,MAAM,GAAG,GAAG,GAAG,IAAI,CAAC,OAAO,SAAS,CAAC;QAErC,MAAM,IAAI,GAA4B;YACpC,GAAG,OAAO,CAAC,eAAe;YAC1B,WAAW,EAAE,KAAK;YAClB,YAAY,EAAE,KAAK;YACnB,OAAO,EAAE,OAAO,CAAC,KAAK;YACtB,IAAI,EAAE,OAAO,CAAC,IAAI;SACnB,CAAC;QAEF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,GAAG,EAAE;YACvC,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,cAAc,EAAE,kBAAkB;gBAClC,aAAa,EAAE,UAAU,aAAa,CAAC,IAAI,CAAC,MAAM,EAAE,uBAAuB,EAAE,eAAe,CAAC,EAAE;gBAC/F,GAAG,OAAO,CAAC,OAAO;aACnB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC;YAC1B,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,MAAM,mBAAmB,CAAC,QAAQ,EAAE,iBAAiB,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;QAExE,MAAM,IAAI,GAAG,CAAC,MAAM,QAAQ,CAAC,IAAI,EAAE,CAA0B,CAAC;QAE9D,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,SAAS,EAAE;YACvD,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,IAAI,CAAC,aAAa,CAAC,EAAE,EAAE,CAAC;YACtB,MAAM,IAAI,QAAQ,CAAC,cAAc,aAAa,CAAC,MAAM,EAAE,EAAE;gBACvD,UAAU,EAAE,aAAa,CAAC,MAAM;gBAChC,KAAK,EAAE,iBAAiB,OAAO,CAAC,OAAO,EAAE;gBACzC,YAAY,EAAE,MAAM,aAAa,CAAC,IAAI,EAAE,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,SAAS,CAAC;aAChE,CAAC,CAAC;QACL,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC;QAEtD,OAAO;YACL,KAAK,EAAE,IAAI,UAAU,CAAC,WAAW,CAAC;YAClC,SAAS,EAAE,YAAY;SACxB,CAAC;IACJ,CAAC;CACF;AAED,MAAM,UAAU,kBAAkB,CAAC,SAAqC,EAAE;IACxE,MAAM,QAAQ,GAAG,IAAI,oBAAoB,CAAC,MAAM,CAAC,CAAC;IAElD,OAAO,SAAS,YAAY,CAAC,OAAgB;QAC3C,OAAO;YACL,QAAQ;YACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;SAC1C,CAAC;IACJ,CAAC,CAAC;AACJ,CAAC"}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"resolve-provider.d.ts","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"resolve-provider.d.ts","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"AAaA,OAAO,KAAK,EAAE,aAAa,EAAkB,MAAM,sBAAsB,CAAC;AA0C1E,wBAAgB,YAAY,CAAC,KAAK,EAAE,MAAM,GAAG,aAAa,GAAG,aAAa,CAsBzE"}
|
package/dist/resolve-provider.js
CHANGED
|
@@ -1,47 +1,47 @@
|
|
|
1
|
-
import { SpeechSDKError } from
|
|
2
|
-
import {
|
|
3
|
-
import {
|
|
4
|
-
import {
|
|
5
|
-
import {
|
|
6
|
-
import {
|
|
7
|
-
import { GoogleSpeechProvider } from
|
|
8
|
-
import {
|
|
9
|
-
import {
|
|
10
|
-
import { MurfSpeechProvider } from
|
|
11
|
-
import {
|
|
12
|
-
import {
|
|
13
|
-
import {
|
|
1
|
+
import { SpeechSDKError } from "./errors.js";
|
|
2
|
+
import { CartesiaSpeechProvider } from "./providers/cartesia/index.js";
|
|
3
|
+
import { DeepgramSpeechProvider } from "./providers/deepgram/index.js";
|
|
4
|
+
import { ElevenLabsSpeechProvider } from "./providers/elevenlabs/index.js";
|
|
5
|
+
import { FalSpeechProvider } from "./providers/fal/index.js";
|
|
6
|
+
import { FishAudioSpeechProvider } from "./providers/fish-audio/index.js";
|
|
7
|
+
import { GoogleSpeechProvider } from "./providers/google/index.js";
|
|
8
|
+
import { HumeSpeechProvider } from "./providers/hume/index.js";
|
|
9
|
+
import { MistralSpeechProvider } from "./providers/mistral/index.js";
|
|
10
|
+
import { MurfSpeechProvider } from "./providers/murf/index.js";
|
|
11
|
+
import { OpenAISpeechProvider } from "./providers/openai/index.js";
|
|
12
|
+
import { ResembleSpeechProvider } from "./providers/resemble/index.js";
|
|
13
|
+
import { UnrealSpeechProvider } from "./providers/unreal-speech/index.js";
|
|
14
14
|
function isResolvedModel(model) {
|
|
15
15
|
return (model != null &&
|
|
16
|
-
typeof model ===
|
|
17
|
-
|
|
18
|
-
|
|
16
|
+
typeof model === "object" &&
|
|
17
|
+
"provider" in model &&
|
|
18
|
+
"modelId" in model);
|
|
19
19
|
}
|
|
20
20
|
function createBuiltinProvider(name) {
|
|
21
21
|
switch (name) {
|
|
22
|
-
case
|
|
22
|
+
case "openai":
|
|
23
23
|
return new OpenAISpeechProvider({});
|
|
24
|
-
case
|
|
24
|
+
case "elevenlabs":
|
|
25
25
|
return new ElevenLabsSpeechProvider({});
|
|
26
|
-
case
|
|
26
|
+
case "deepgram":
|
|
27
27
|
return new DeepgramSpeechProvider({});
|
|
28
|
-
case
|
|
28
|
+
case "cartesia":
|
|
29
29
|
return new CartesiaSpeechProvider({});
|
|
30
|
-
case
|
|
30
|
+
case "hume":
|
|
31
31
|
return new HumeSpeechProvider({});
|
|
32
|
-
case
|
|
32
|
+
case "google":
|
|
33
33
|
return new GoogleSpeechProvider({});
|
|
34
|
-
case
|
|
34
|
+
case "fish-audio":
|
|
35
35
|
return new FishAudioSpeechProvider({});
|
|
36
|
-
case
|
|
36
|
+
case "unreal-speech":
|
|
37
37
|
return new UnrealSpeechProvider({});
|
|
38
|
-
case
|
|
38
|
+
case "murf":
|
|
39
39
|
return new MurfSpeechProvider({});
|
|
40
|
-
case
|
|
40
|
+
case "resemble":
|
|
41
41
|
return new ResembleSpeechProvider({});
|
|
42
|
-
case
|
|
42
|
+
case "fal-ai":
|
|
43
43
|
return new FalSpeechProvider({});
|
|
44
|
-
case
|
|
44
|
+
case "mistral":
|
|
45
45
|
return new MistralSpeechProvider({});
|
|
46
46
|
default:
|
|
47
47
|
throw new SpeechSDKError(`Unknown provider: ${name}`);
|
|
@@ -51,17 +51,17 @@ export function resolveModel(model) {
|
|
|
51
51
|
if (isResolvedModel(model)) {
|
|
52
52
|
return model;
|
|
53
53
|
}
|
|
54
|
-
const slashIndex = model.indexOf(
|
|
54
|
+
const slashIndex = model.indexOf("/");
|
|
55
55
|
let providerName;
|
|
56
56
|
let modelId;
|
|
57
|
-
if (slashIndex
|
|
58
|
-
providerName = model.slice(0, slashIndex);
|
|
59
|
-
modelId = model.slice(slashIndex + 1);
|
|
60
|
-
}
|
|
61
|
-
else {
|
|
57
|
+
if (slashIndex === -1) {
|
|
62
58
|
providerName = model;
|
|
63
59
|
modelId = undefined;
|
|
64
60
|
}
|
|
61
|
+
else {
|
|
62
|
+
providerName = model.slice(0, slashIndex);
|
|
63
|
+
modelId = model.slice(slashIndex + 1);
|
|
64
|
+
}
|
|
65
65
|
const provider = createBuiltinProvider(providerName);
|
|
66
66
|
return {
|
|
67
67
|
provider,
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"resolve-provider.js","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"resolve-provider.js","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,cAAc,EAAE,MAAM,aAAa,CAAC;AAC7C,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,wBAAwB,EAAE,MAAM,iCAAiC,CAAC;AAC3E,OAAO,EAAE,iBAAiB,EAAE,MAAM,0BAA0B,CAAC;AAC7D,OAAO,EAAE,uBAAuB,EAAE,MAAM,iCAAiC,CAAC;AAC1E,OAAO,EAAE,oBAAoB,EAAE,MAAM,6BAA6B,CAAC;AACnE,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,qBAAqB,EAAE,MAAM,8BAA8B,CAAC;AACrE,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,oBAAoB,EAAE,MAAM,6BAA6B,CAAC;AACnE,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,oBAAoB,EAAE,MAAM,oCAAoC,CAAC;AAG1E,SAAS,eAAe,CAAC,KAAc;IACrC,OAAO,CACL,KAAK,IAAI,IAAI;QACb,OAAO,KAAK,KAAK,QAAQ;QACzB,UAAU,IAAI,KAAK;QACnB,SAAS,IAAI,KAAK,CACnB,CAAC;AACJ,CAAC;AAED,SAAS,qBAAqB,CAAC,IAAY;IACzC,QAAQ,IAAI,EAAE,CAAC;QACb,KAAK,QAAQ;YACX,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QACtC,KAAK,YAAY;YACf,OAAO,IAAI,wBAAwB,CAAC,EAAE,CAAC,CAAC;QAC1C,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QACxC,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QACxC,KAAK,MAAM;YACT,OAAO,IAAI,kBAAkB,CAAC,EAAE,CAAC,CAAC;QACpC,KAAK,QAAQ;YACX,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QACtC,KAAK,YAAY;YACf,OAAO,IAAI,uBAAuB,CAAC,EAAE,CAAC,CAAC;QACzC,KAAK,eAAe;YAClB,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QACtC,KAAK,MAAM;YACT,OAAO,IAAI,kBAAkB,CAAC,EAAE,CAAC,CAAC;QACpC,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QACxC,KAAK,QAAQ;YACX,OAAO,IAAI,iBAAiB,CAAC,EAAE,CAAC,CAAC;QACnC,KAAK,SAAS;YACZ,OAAO,IAAI,qBAAqB,CAAC,EAAE,CAAC,CAAC;QACvC;YACE,MAAM,IAAI,cAAc,CAAC,qBAAqB,IAAI,EAAE,CAAC,CAAC;IAC1D,CAAC;AACH,CAAC;AAED,MAAM,UAAU,YAAY,CAAC,KAA6B;IACxD,IAAI,eAAe,CAAC,KAAK,CAAC,EAAE,CAAC;QAC3B,OAAO,KAAK,CAAC;IACf,CAAC;IAED,MAAM,UAAU,GAAG,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;IACtC,IAAI,YAAoB,CAAC;IACzB,IAAI,OAA2B,CAAC;IAEhC,IAAI,UAAU,KAAK,CAAC,CAAC,EAAE,CAAC;QACtB,YAAY,GAAG,KAAK,CAAC;QACrB,OAAO,GAAG,SAAS,CAAC;IACtB,CAAC;SAAM,CAAC;QACN,YAAY,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,UAAU,CAAC,CAAC;QAC1C,OAAO,GAAG,KAAK,CAAC,KAAK,CAAC,UAAU,GAAG,CAAC,CAAC,CAAC;IACxC,CAAC;IAED,MAAM,QAAQ,GAAG,qBAAqB,CAAC,YAAY,CAAC,CAAC;IACrD,OAAO;QACL,QAAQ;QACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;KAC1C,CAAC;AACJ,CAAC"}
|
|
@@ -5,16 +5,14 @@ export type Voice = string | {
|
|
|
5
5
|
};
|
|
6
6
|
export interface ModelInfo {
|
|
7
7
|
id: string;
|
|
8
|
+
inlineVoiceCloning: boolean;
|
|
8
9
|
languages: readonly string[];
|
|
9
|
-
releaseDate: string;
|
|
10
10
|
openSource: boolean;
|
|
11
|
-
|
|
11
|
+
releaseDate: string;
|
|
12
12
|
zeroDataRetention: boolean;
|
|
13
13
|
}
|
|
14
14
|
export interface SpeechProvider<TModel extends string = string, TVoice extends Voice = Voice> {
|
|
15
|
-
id: string;
|
|
16
15
|
defaultModel: TModel;
|
|
17
|
-
models: readonly ModelInfo[];
|
|
18
16
|
generate(options: {
|
|
19
17
|
modelId: string;
|
|
20
18
|
text: string;
|
|
@@ -27,9 +25,15 @@ export interface SpeechProvider<TModel extends string = string, TVoice extends V
|
|
|
27
25
|
mediaType: string;
|
|
28
26
|
providerMetadata?: Record<string, unknown>;
|
|
29
27
|
}>;
|
|
28
|
+
id: string;
|
|
29
|
+
models: readonly ModelInfo[];
|
|
30
|
+
processAudioTags?(text: string, modelId: string): {
|
|
31
|
+
text: string;
|
|
32
|
+
warnings: string[];
|
|
33
|
+
};
|
|
30
34
|
}
|
|
31
35
|
export interface ResolvedModel<TVoice extends Voice = Voice> {
|
|
32
|
-
provider: SpeechProvider<string, TVoice>;
|
|
33
36
|
modelId: string;
|
|
37
|
+
provider: SpeechProvider<string, TVoice>;
|
|
34
38
|
}
|
|
35
39
|
//# sourceMappingURL=speech-provider.d.ts.map
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"speech-provider.d.ts","sourceRoot":"","sources":["../src/speech-provider.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,KAAK,
|
|
1
|
+
{"version":3,"file":"speech-provider.d.ts","sourceRoot":"","sources":["../src/speech-provider.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,KAAK,GAAG,MAAM,GAAG;IAAE,GAAG,EAAE,MAAM,CAAA;CAAE,GAAG;IAAE,KAAK,EAAE,MAAM,GAAG,UAAU,CAAA;CAAE,CAAC;AAE9E,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,kBAAkB,EAAE,OAAO,CAAC;IAC5B,SAAS,EAAE,SAAS,MAAM,EAAE,CAAC;IAC7B,UAAU,EAAE,OAAO,CAAC;IACpB,WAAW,EAAE,MAAM,CAAC;IACpB,iBAAiB,EAAE,OAAO,CAAC;CAC5B;AAED,MAAM,WAAW,cAAc,CAC7B,MAAM,SAAS,MAAM,GAAG,MAAM,EAC9B,MAAM,SAAS,KAAK,GAAG,KAAK;IAE5B,YAAY,EAAE,MAAM,CAAC;IAErB,QAAQ,CAAC,OAAO,EAAE;QAChB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,MAAM,GAAG,UAAU,CAAC;QAC3B,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC,CAAC;IACH,EAAE,EAAE,MAAM,CAAC;IACX,MAAM,EAAE,SAAS,SAAS,EAAE,CAAC;IAE7B,gBAAgB,CAAC,CACf,IAAI,EAAE,MAAM,EACZ,OAAO,EAAE,MAAM,GACd;QAAE,IAAI,EAAE,MAAM,CAAC;QAAC,QAAQ,EAAE,MAAM,EAAE,CAAA;KAAE,CAAC;CACzC;AAED,MAAM,WAAW,aAAa,CAAC,MAAM,SAAS,KAAK,GAAG,KAAK;IACzD,OAAO,EAAE,MAAM,CAAC;IAChB,QAAQ,EAAE,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;CAC1C"}
|
package/dist/speech-result.d.ts
CHANGED
|
@@ -1,18 +1,19 @@
|
|
|
1
1
|
export interface GeneratedAudioFile {
|
|
2
|
-
readonly uint8Array: Uint8Array;
|
|
3
2
|
readonly base64: string;
|
|
4
3
|
readonly mediaType: string;
|
|
4
|
+
readonly uint8Array: Uint8Array;
|
|
5
5
|
}
|
|
6
6
|
export interface SpeechResult {
|
|
7
7
|
readonly audio: GeneratedAudioFile;
|
|
8
8
|
readonly providerMetadata?: Record<string, unknown>;
|
|
9
|
+
readonly warnings?: string[];
|
|
9
10
|
}
|
|
10
11
|
export declare class DefaultGeneratedAudioFile implements GeneratedAudioFile {
|
|
11
12
|
readonly mediaType: string;
|
|
12
|
-
private _data;
|
|
13
|
+
private readonly _data;
|
|
13
14
|
private _uint8Array?;
|
|
14
15
|
private _base64?;
|
|
15
|
-
constructor({ data, mediaType }: {
|
|
16
|
+
constructor({ data, mediaType, }: {
|
|
16
17
|
data: string | Uint8Array;
|
|
17
18
|
mediaType: string;
|
|
18
19
|
});
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"speech-result.d.ts","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"AAAA,MAAM,WAAW,kBAAkB;IACjC,QAAQ,CAAC,
|
|
1
|
+
{"version":3,"file":"speech-result.d.ts","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"AAAA,MAAM,WAAW,kBAAkB;IACjC,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;IAC3B,QAAQ,CAAC,UAAU,EAAE,UAAU,CAAC;CACjC;AAED,MAAM,WAAW,YAAY;IAC3B,QAAQ,CAAC,KAAK,EAAE,kBAAkB,CAAC;IACnC,QAAQ,CAAC,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;IACpD,QAAQ,CAAC,QAAQ,CAAC,EAAE,MAAM,EAAE,CAAC;CAC9B;AAED,qBAAa,yBAA0B,YAAW,kBAAkB;IAClE,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;IAE3B,OAAO,CAAC,QAAQ,CAAC,KAAK,CAAsB;IAC5C,OAAO,CAAC,WAAW,CAAC,CAAa;IACjC,OAAO,CAAC,OAAO,CAAC,CAAS;gBAEb,EACV,IAAI,EACJ,SAAS,GACV,EAAE;QAAE,IAAI,EAAE,MAAM,GAAG,UAAU,CAAC;QAAC,SAAS,EAAE,MAAM,CAAA;KAAE;IAKnD,IAAI,UAAU,IAAI,UAAU,CAe3B;IAED,IAAI,MAAM,IAAI,MAAM,CAcnB;CACF"}
|
package/dist/speech-result.js
CHANGED
|
@@ -3,13 +3,14 @@ export class DefaultGeneratedAudioFile {
|
|
|
3
3
|
_data;
|
|
4
4
|
_uint8Array;
|
|
5
5
|
_base64;
|
|
6
|
-
constructor({ data, mediaType }) {
|
|
6
|
+
constructor({ data, mediaType, }) {
|
|
7
7
|
this._data = data;
|
|
8
8
|
this.mediaType = mediaType;
|
|
9
9
|
}
|
|
10
10
|
get uint8Array() {
|
|
11
|
-
if (this._uint8Array != null)
|
|
11
|
+
if (this._uint8Array != null) {
|
|
12
12
|
return this._uint8Array;
|
|
13
|
+
}
|
|
13
14
|
if (this._data instanceof Uint8Array) {
|
|
14
15
|
this._uint8Array = this._data;
|
|
15
16
|
}
|
|
@@ -24,15 +25,16 @@ export class DefaultGeneratedAudioFile {
|
|
|
24
25
|
return this._uint8Array;
|
|
25
26
|
}
|
|
26
27
|
get base64() {
|
|
27
|
-
if (this._base64 != null)
|
|
28
|
+
if (this._base64 != null) {
|
|
28
29
|
return this._base64;
|
|
29
|
-
|
|
30
|
+
}
|
|
31
|
+
if (typeof this._data === "string") {
|
|
30
32
|
this._base64 = this._data;
|
|
31
33
|
}
|
|
32
34
|
else {
|
|
33
|
-
let binaryString =
|
|
34
|
-
for (
|
|
35
|
-
binaryString += String.fromCharCode(
|
|
35
|
+
let binaryString = "";
|
|
36
|
+
for (const byte of this._data) {
|
|
37
|
+
binaryString += String.fromCharCode(byte);
|
|
36
38
|
}
|
|
37
39
|
this._base64 = btoa(binaryString);
|
|
38
40
|
}
|
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"speech-result.js","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"
|
|
1
|
+
{"version":3,"file":"speech-result.js","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"AAYA,MAAM,OAAO,yBAAyB;IAC3B,SAAS,CAAS;IAEV,KAAK,CAAsB;IACpC,WAAW,CAAc;IACzB,OAAO,CAAU;IAEzB,YAAY,EACV,IAAI,EACJ,SAAS,GACwC;QACjD,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC;QAClB,IAAI,CAAC,SAAS,GAAG,SAAS,CAAC;IAC7B,CAAC;IAED,IAAI,UAAU;QACZ,IAAI,IAAI,CAAC,WAAW,IAAI,IAAI,EAAE,CAAC;YAC7B,OAAO,IAAI,CAAC,WAAW,CAAC;QAC1B,CAAC;QACD,IAAI,IAAI,CAAC,KAAK,YAAY,UAAU,EAAE,CAAC;YACrC,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,KAAK,CAAC;QAChC,CAAC;aAAM,CAAC;YACN,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YACtC,MAAM,KAAK,GAAG,IAAI,UAAU,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC;YAClD,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,YAAY,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;gBAC7C,KAAK,CAAC,CAAC,CAAC,GAAG,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;YACxC,CAAC;YACD,IAAI,CAAC,WAAW,GAAG,KAAK,CAAC;QAC3B,CAAC;QACD,OAAO,IAAI,CAAC,WAAW,CAAC;IAC1B,CAAC;IAED,IAAI,MAAM;QACR,IAAI,IAAI,CAAC,OAAO,IAAI,IAAI,EAAE,CAAC;YACzB,OAAO,IAAI,CAAC,OAAO,CAAC;QACtB,CAAC;QACD,IAAI,OAAO,IAAI,CAAC,KAAK,KAAK,QAAQ,EAAE,CAAC;YACnC,IAAI,CAAC,OAAO,GAAG,IAAI,CAAC,KAAK,CAAC;QAC5B,CAAC;aAAM,CAAC;YACN,IAAI,YAAY,GAAG,EAAE,CAAC;YACtB,KAAK,MAAM,IAAI,IAAI,IAAI,CAAC,KAAK,EAAE,CAAC;gBAC9B,YAAY,IAAI,MAAM,CAAC,YAAY,CAAC,IAAI,CAAC,CAAC;YAC5C,CAAC;YACD,IAAI,CAAC,OAAO,GAAG,IAAI,CAAC,YAAY,CAAC,CAAC;QACpC,CAAC;QACD,OAAO,IAAI,CAAC,OAAO,CAAC;IACtB,CAAC;CACF"}
|