@speech-sdk/core 0.0.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +185 -0
- package/dist/errors.d.ts +20 -0
- package/dist/errors.d.ts.map +1 -0
- package/dist/errors.js +25 -0
- package/dist/errors.js.map +1 -0
- package/dist/generate-speech.d.ts +12 -0
- package/dist/generate-speech.d.ts.map +1 -0
- package/dist/generate-speech.js +39 -0
- package/dist/generate-speech.js.map +1 -0
- package/dist/index.d.ts +6 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +3 -0
- package/dist/index.js.map +1 -0
- package/dist/provider-utils.d.ts +3 -0
- package/dist/provider-utils.d.ts.map +1 -0
- package/dist/provider-utils.js +49 -0
- package/dist/provider-utils.js.map +1 -0
- package/dist/providers/cartesia/index.d.ts +35 -0
- package/dist/providers/cartesia/index.d.ts.map +1 -0
- package/dist/providers/cartesia/index.js +59 -0
- package/dist/providers/cartesia/index.js.map +1 -0
- package/dist/providers/deepgram/index.d.ts +32 -0
- package/dist/providers/deepgram/index.d.ts.map +1 -0
- package/dist/providers/deepgram/index.js +53 -0
- package/dist/providers/deepgram/index.js.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-options.d.ts +2 -0
- package/dist/providers/elevenlabs/elevenlabs-options.d.ts.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-options.js +2 -0
- package/dist/providers/elevenlabs/elevenlabs-options.js.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-provider.d.ts +5 -0
- package/dist/providers/elevenlabs/elevenlabs-provider.d.ts.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-provider.js +11 -0
- package/dist/providers/elevenlabs/elevenlabs-provider.js.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-speech-model.d.ts +44 -0
- package/dist/providers/elevenlabs/elevenlabs-speech-model.d.ts.map +1 -0
- package/dist/providers/elevenlabs/elevenlabs-speech-model.js +82 -0
- package/dist/providers/elevenlabs/elevenlabs-speech-model.js.map +1 -0
- package/dist/providers/elevenlabs/index.d.ts +44 -0
- package/dist/providers/elevenlabs/index.d.ts.map +1 -0
- package/dist/providers/elevenlabs/index.js +91 -0
- package/dist/providers/elevenlabs/index.js.map +1 -0
- package/dist/providers/fal/index.d.ts +35 -0
- package/dist/providers/fal/index.d.ts.map +1 -0
- package/dist/providers/fal/index.js +70 -0
- package/dist/providers/fal/index.js.map +1 -0
- package/dist/providers/fish-audio/index.d.ts +32 -0
- package/dist/providers/fish-audio/index.d.ts.map +1 -0
- package/dist/providers/fish-audio/index.js +54 -0
- package/dist/providers/fish-audio/index.js.map +1 -0
- package/dist/providers/google/index.d.ts +35 -0
- package/dist/providers/google/index.d.ts.map +1 -0
- package/dist/providers/google/index.js +71 -0
- package/dist/providers/google/index.js.map +1 -0
- package/dist/providers/hume/index.d.ts +36 -0
- package/dist/providers/hume/index.d.ts.map +1 -0
- package/dist/providers/hume/index.js +66 -0
- package/dist/providers/hume/index.js.map +1 -0
- package/dist/providers/mistral/index.d.ts +37 -0
- package/dist/providers/mistral/index.d.ts.map +1 -0
- package/dist/providers/mistral/index.js +66 -0
- package/dist/providers/mistral/index.js.map +1 -0
- package/dist/providers/murf/index.d.ts +35 -0
- package/dist/providers/murf/index.d.ts.map +1 -0
- package/dist/providers/murf/index.js +68 -0
- package/dist/providers/murf/index.js.map +1 -0
- package/dist/providers/openai/index.d.ts +39 -0
- package/dist/providers/openai/index.d.ts.map +1 -0
- package/dist/providers/openai/index.js +63 -0
- package/dist/providers/openai/index.js.map +1 -0
- package/dist/providers/openai/openai-options.d.ts +2 -0
- package/dist/providers/openai/openai-options.d.ts.map +1 -0
- package/dist/providers/openai/openai-options.js +2 -0
- package/dist/providers/openai/openai-options.js.map +1 -0
- package/dist/providers/openai/openai-provider.d.ts +5 -0
- package/dist/providers/openai/openai-provider.d.ts.map +1 -0
- package/dist/providers/openai/openai-provider.js +11 -0
- package/dist/providers/openai/openai-provider.js.map +1 -0
- package/dist/providers/openai/openai-speech-model.d.ts +39 -0
- package/dist/providers/openai/openai-speech-model.d.ts.map +1 -0
- package/dist/providers/openai/openai-speech-model.js +54 -0
- package/dist/providers/openai/openai-speech-model.js.map +1 -0
- package/dist/providers/resemble/index.d.ts +32 -0
- package/dist/providers/resemble/index.d.ts.map +1 -0
- package/dist/providers/resemble/index.js +50 -0
- package/dist/providers/resemble/index.js.map +1 -0
- package/dist/providers/unreal-speech/index.d.ts +32 -0
- package/dist/providers/unreal-speech/index.d.ts.map +1 -0
- package/dist/providers/unreal-speech/index.js +64 -0
- package/dist/providers/unreal-speech/index.js.map +1 -0
- package/dist/resolve-provider.d.ts +3 -0
- package/dist/resolve-provider.d.ts.map +1 -0
- package/dist/resolve-provider.js +71 -0
- package/dist/resolve-provider.js.map +1 -0
- package/dist/speech-provider.d.ts +31 -0
- package/dist/speech-provider.d.ts.map +1 -0
- package/dist/speech-provider.js +2 -0
- package/dist/speech-provider.js.map +1 -0
- package/dist/speech-result.d.ts +22 -0
- package/dist/speech-result.d.ts.map +1 -0
- package/dist/speech-result.js +42 -0
- package/dist/speech-result.js.map +1 -0
- package/dist/types.d.ts +11 -0
- package/dist/types.d.ts.map +1 -0
- package/dist/types.js +2 -0
- package/dist/types.js.map +1 -0
- package/package.json +96 -0
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
import type { SpeechProvider, ResolvedModel } from '../../speech-provider.js';
|
|
2
|
+
export interface ResembleSpeechProviderConfig {
|
|
3
|
+
apiKey?: string;
|
|
4
|
+
baseURL?: string;
|
|
5
|
+
fetch?: typeof globalThis.fetch;
|
|
6
|
+
}
|
|
7
|
+
export declare class ResembleSpeechProvider implements SpeechProvider<string, string> {
|
|
8
|
+
readonly id = "resemble";
|
|
9
|
+
readonly defaultModel = "default";
|
|
10
|
+
readonly models: readonly [{
|
|
11
|
+
readonly id: "default";
|
|
12
|
+
readonly languages: readonly ["en"];
|
|
13
|
+
}];
|
|
14
|
+
private readonly apiKey;
|
|
15
|
+
private readonly baseURL;
|
|
16
|
+
private readonly fetchFn;
|
|
17
|
+
constructor(config: ResembleSpeechProviderConfig);
|
|
18
|
+
generate(options: {
|
|
19
|
+
modelId: string;
|
|
20
|
+
text: string;
|
|
21
|
+
voice?: string;
|
|
22
|
+
providerOptions?: Record<string, unknown>;
|
|
23
|
+
abortSignal?: AbortSignal;
|
|
24
|
+
headers?: Record<string, string>;
|
|
25
|
+
}): Promise<{
|
|
26
|
+
audio: string;
|
|
27
|
+
mediaType: string;
|
|
28
|
+
providerMetadata?: Record<string, unknown>;
|
|
29
|
+
}>;
|
|
30
|
+
}
|
|
31
|
+
export declare function createResemble(config?: ResembleSpeechProviderConfig): (modelId?: string) => ResolvedModel<string>;
|
|
32
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,aAAa,EAAE,MAAM,0BAA0B,CAAC;AAG9E,MAAM,WAAW,4BAA4B;IAC3C,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,OAAO,UAAU,CAAC,KAAK,CAAC;CACjC;AAED,qBAAa,sBAAuB,YAAW,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC;IAC3E,QAAQ,CAAC,EAAE,cAAc;IACzB,QAAQ,CAAC,YAAY,aAAa;IAElC,QAAQ,CAAC,MAAM;;;OAEJ;IAEX,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAqB;IAC5C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;IACjC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAA0B;gBAEtC,MAAM,EAAE,4BAA4B;IAM1C,QAAQ,CAAC,OAAO,EAAE;QACtB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,MAAM,CAAC;QACd,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC;CA6BH;AAED,wBAAgB,cAAc,CAAC,MAAM,GAAE,4BAAiC,IAG7C,UAAU,MAAM,KAAG,aAAa,CAAC,MAAM,CAAC,CAMlE"}
|
|
@@ -0,0 +1,50 @@
|
|
|
1
|
+
import { resolveApiKey, handleErrorResponse } from '../../provider-utils.js';
|
|
2
|
+
export class ResembleSpeechProvider {
|
|
3
|
+
id = 'resemble';
|
|
4
|
+
defaultModel = 'default';
|
|
5
|
+
models = [
|
|
6
|
+
{ id: 'default', languages: ['en'] },
|
|
7
|
+
];
|
|
8
|
+
apiKey;
|
|
9
|
+
baseURL;
|
|
10
|
+
fetchFn;
|
|
11
|
+
constructor(config) {
|
|
12
|
+
this.apiKey = config.apiKey;
|
|
13
|
+
this.baseURL = config.baseURL ?? 'https://f.cluster.resemble.ai';
|
|
14
|
+
this.fetchFn = config.fetch ?? globalThis.fetch;
|
|
15
|
+
}
|
|
16
|
+
async generate(options) {
|
|
17
|
+
const url = `${this.baseURL}/synthesize`;
|
|
18
|
+
const body = {
|
|
19
|
+
...options.providerOptions,
|
|
20
|
+
voice_uuid: options.voice,
|
|
21
|
+
data: options.text,
|
|
22
|
+
};
|
|
23
|
+
const response = await this.fetchFn(url, {
|
|
24
|
+
method: 'POST',
|
|
25
|
+
headers: {
|
|
26
|
+
'Content-Type': 'application/json',
|
|
27
|
+
'Authorization': resolveApiKey(this.apiKey, 'RESEMBLE_API_KEY', 'Resemble'),
|
|
28
|
+
...options.headers,
|
|
29
|
+
},
|
|
30
|
+
body: JSON.stringify(body),
|
|
31
|
+
signal: options.abortSignal,
|
|
32
|
+
});
|
|
33
|
+
await handleErrorResponse(response, `resemble/${options.modelId}`);
|
|
34
|
+
const json = await response.json();
|
|
35
|
+
return {
|
|
36
|
+
audio: json.audio_content,
|
|
37
|
+
mediaType: 'audio/wav',
|
|
38
|
+
};
|
|
39
|
+
}
|
|
40
|
+
}
|
|
41
|
+
export function createResemble(config = {}) {
|
|
42
|
+
const provider = new ResembleSpeechProvider(config);
|
|
43
|
+
return function resemble(modelId) {
|
|
44
|
+
return {
|
|
45
|
+
provider,
|
|
46
|
+
modelId: modelId ?? provider.defaultModel,
|
|
47
|
+
};
|
|
48
|
+
};
|
|
49
|
+
}
|
|
50
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/resemble/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,aAAa,EAAE,mBAAmB,EAAE,MAAM,yBAAyB,CAAC;AAQ7E,MAAM,OAAO,sBAAsB;IACxB,EAAE,GAAG,UAAU,CAAC;IAChB,YAAY,GAAG,SAAS,CAAC;IAEzB,MAAM,GAAG;QAChB,EAAE,EAAE,EAAE,SAAS,EAAE,SAAS,EAAE,CAAC,IAAI,CAAC,EAAE;KAC5B,CAAC;IAEM,MAAM,CAAqB;IAC3B,OAAO,CAAS;IAChB,OAAO,CAA0B;IAElD,YAAY,MAAoC;QAC9C,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,OAAO,IAAI,+BAA+B,CAAC;QACjE,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,KAAK,IAAI,UAAU,CAAC,KAAK,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,OAOd;QAKC,MAAM,GAAG,GAAG,GAAG,IAAI,CAAC,OAAO,aAAa,CAAC;QAEzC,MAAM,IAAI,GAA4B;YACpC,GAAG,OAAO,CAAC,eAAe;YAC1B,UAAU,EAAE,OAAO,CAAC,KAAK;YACzB,IAAI,EAAE,OAAO,CAAC,IAAI;SACnB,CAAC;QAEF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,GAAG,EAAE;YACvC,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,cAAc,EAAE,kBAAkB;gBAClC,eAAe,EAAE,aAAa,CAAC,IAAI,CAAC,MAAM,EAAE,kBAAkB,EAAE,UAAU,CAAC;gBAC3E,GAAG,OAAO,CAAC,OAAO;aACnB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC;YAC1B,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,MAAM,mBAAmB,CAAC,QAAQ,EAAE,YAAY,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;QAEnE,MAAM,IAAI,GAAG,MAAM,QAAQ,CAAC,IAAI,EAA+B,CAAC;QAEhE,OAAO;YACL,KAAK,EAAE,IAAI,CAAC,aAAa;YACzB,SAAS,EAAE,WAAW;SACvB,CAAC;IACJ,CAAC;CACF;AAED,MAAM,UAAU,cAAc,CAAC,SAAuC,EAAE;IACtE,MAAM,QAAQ,GAAG,IAAI,sBAAsB,CAAC,MAAM,CAAC,CAAC;IAEpD,OAAO,SAAS,QAAQ,CAAC,OAAgB;QACvC,OAAO;YACL,QAAQ;YACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;SAC1C,CAAC;IACJ,CAAC,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
import type { SpeechProvider, ResolvedModel } from '../../speech-provider.js';
|
|
2
|
+
export interface UnrealSpeechProviderConfig {
|
|
3
|
+
apiKey?: string;
|
|
4
|
+
baseURL?: string;
|
|
5
|
+
fetch?: typeof globalThis.fetch;
|
|
6
|
+
}
|
|
7
|
+
export declare class UnrealSpeechProvider implements SpeechProvider<string, string> {
|
|
8
|
+
readonly id = "unreal-speech";
|
|
9
|
+
readonly defaultModel = "default";
|
|
10
|
+
readonly models: readonly [{
|
|
11
|
+
readonly id: "default";
|
|
12
|
+
readonly languages: readonly ["en"];
|
|
13
|
+
}];
|
|
14
|
+
private readonly apiKey;
|
|
15
|
+
private readonly baseURL;
|
|
16
|
+
private readonly fetchFn;
|
|
17
|
+
constructor(config: UnrealSpeechProviderConfig);
|
|
18
|
+
generate(options: {
|
|
19
|
+
modelId: string;
|
|
20
|
+
text: string;
|
|
21
|
+
voice?: string;
|
|
22
|
+
providerOptions?: Record<string, unknown>;
|
|
23
|
+
abortSignal?: AbortSignal;
|
|
24
|
+
headers?: Record<string, string>;
|
|
25
|
+
}): Promise<{
|
|
26
|
+
audio: Uint8Array;
|
|
27
|
+
mediaType: string;
|
|
28
|
+
providerMetadata?: Record<string, unknown>;
|
|
29
|
+
}>;
|
|
30
|
+
}
|
|
31
|
+
export declare function createUnrealSpeech(config?: UnrealSpeechProviderConfig): (modelId?: string) => ResolvedModel<string>;
|
|
32
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,cAAc,EAAE,aAAa,EAAE,MAAM,0BAA0B,CAAC;AAI9E,MAAM,WAAW,0BAA0B;IACzC,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,KAAK,CAAC,EAAE,OAAO,UAAU,CAAC,KAAK,CAAC;CACjC;AAED,qBAAa,oBAAqB,YAAW,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC;IACzE,QAAQ,CAAC,EAAE,mBAAmB;IAC9B,QAAQ,CAAC,YAAY,aAAa;IAElC,QAAQ,CAAC,MAAM;;;OAEJ;IAEX,OAAO,CAAC,QAAQ,CAAC,MAAM,CAAqB;IAC5C,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAS;IACjC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAA0B;gBAEtC,MAAM,EAAE,0BAA0B;IAMxC,QAAQ,CAAC,OAAO,EAAE;QACtB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,UAAU,CAAC;QAClB,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC;CA6CH;AAED,wBAAgB,kBAAkB,CAAC,MAAM,GAAE,0BAA+B,IAG3C,UAAU,MAAM,KAAG,aAAa,CAAC,MAAM,CAAC,CAMtE"}
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
import { resolveApiKey, handleErrorResponse } from '../../provider-utils.js';
|
|
2
|
+
import { ApiError } from '../../errors.js';
|
|
3
|
+
export class UnrealSpeechProvider {
|
|
4
|
+
id = 'unreal-speech';
|
|
5
|
+
defaultModel = 'default';
|
|
6
|
+
models = [
|
|
7
|
+
{ id: 'default', languages: ['en'] },
|
|
8
|
+
];
|
|
9
|
+
apiKey;
|
|
10
|
+
baseURL;
|
|
11
|
+
fetchFn;
|
|
12
|
+
constructor(config) {
|
|
13
|
+
this.apiKey = config.apiKey;
|
|
14
|
+
this.baseURL = config.baseURL ?? 'https://api.v8.unrealspeech.com';
|
|
15
|
+
this.fetchFn = config.fetch ?? globalThis.fetch;
|
|
16
|
+
}
|
|
17
|
+
async generate(options) {
|
|
18
|
+
const url = `${this.baseURL}/speech`;
|
|
19
|
+
const body = {
|
|
20
|
+
...options.providerOptions,
|
|
21
|
+
AudioFormat: 'mp3',
|
|
22
|
+
OutputFormat: 'uri',
|
|
23
|
+
VoiceId: options.voice,
|
|
24
|
+
Text: options.text,
|
|
25
|
+
};
|
|
26
|
+
const response = await this.fetchFn(url, {
|
|
27
|
+
method: 'POST',
|
|
28
|
+
headers: {
|
|
29
|
+
'Content-Type': 'application/json',
|
|
30
|
+
'Authorization': `Bearer ${resolveApiKey(this.apiKey, 'UNREAL_SPEECH_API_KEY', 'Unreal Speech')}`,
|
|
31
|
+
...options.headers,
|
|
32
|
+
},
|
|
33
|
+
body: JSON.stringify(body),
|
|
34
|
+
signal: options.abortSignal,
|
|
35
|
+
});
|
|
36
|
+
await handleErrorResponse(response, `unreal-speech/${options.modelId}`);
|
|
37
|
+
const json = await response.json();
|
|
38
|
+
const audioResponse = await this.fetchFn(json.OutputUri, {
|
|
39
|
+
signal: options.abortSignal,
|
|
40
|
+
});
|
|
41
|
+
if (!audioResponse.ok) {
|
|
42
|
+
throw new ApiError(`API error: ${audioResponse.status}`, {
|
|
43
|
+
statusCode: audioResponse.status,
|
|
44
|
+
model: `unreal-speech/${options.modelId}`,
|
|
45
|
+
responseBody: await audioResponse.text().catch(() => undefined),
|
|
46
|
+
});
|
|
47
|
+
}
|
|
48
|
+
const arrayBuffer = await audioResponse.arrayBuffer();
|
|
49
|
+
return {
|
|
50
|
+
audio: new Uint8Array(arrayBuffer),
|
|
51
|
+
mediaType: 'audio/mpeg',
|
|
52
|
+
};
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
export function createUnrealSpeech(config = {}) {
|
|
56
|
+
const provider = new UnrealSpeechProvider(config);
|
|
57
|
+
return function unrealSpeech(modelId) {
|
|
58
|
+
return {
|
|
59
|
+
provider,
|
|
60
|
+
modelId: modelId ?? provider.defaultModel,
|
|
61
|
+
};
|
|
62
|
+
};
|
|
63
|
+
}
|
|
64
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/providers/unreal-speech/index.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,aAAa,EAAE,mBAAmB,EAAE,MAAM,yBAAyB,CAAC;AAC7E,OAAO,EAAE,QAAQ,EAAE,MAAM,iBAAiB,CAAC;AAQ3C,MAAM,OAAO,oBAAoB;IACtB,EAAE,GAAG,eAAe,CAAC;IACrB,YAAY,GAAG,SAAS,CAAC;IAEzB,MAAM,GAAG;QAChB,EAAE,EAAE,EAAE,SAAS,EAAE,SAAS,EAAE,CAAC,IAAI,CAAC,EAAE;KAC5B,CAAC;IAEM,MAAM,CAAqB;IAC3B,OAAO,CAAS;IAChB,OAAO,CAA0B;IAElD,YAAY,MAAkC;QAC5C,IAAI,CAAC,MAAM,GAAG,MAAM,CAAC,MAAM,CAAC;QAC5B,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,OAAO,IAAI,iCAAiC,CAAC;QACnE,IAAI,CAAC,OAAO,GAAG,MAAM,CAAC,KAAK,IAAI,UAAU,CAAC,KAAK,CAAC;IAClD,CAAC;IAED,KAAK,CAAC,QAAQ,CAAC,OAOd;QAKC,MAAM,GAAG,GAAG,GAAG,IAAI,CAAC,OAAO,SAAS,CAAC;QAErC,MAAM,IAAI,GAA4B;YACpC,GAAG,OAAO,CAAC,eAAe;YAC1B,WAAW,EAAE,KAAK;YAClB,YAAY,EAAE,KAAK;YACnB,OAAO,EAAE,OAAO,CAAC,KAAK;YACtB,IAAI,EAAE,OAAO,CAAC,IAAI;SACnB,CAAC;QAEF,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,GAAG,EAAE;YACvC,MAAM,EAAE,MAAM;YACd,OAAO,EAAE;gBACP,cAAc,EAAE,kBAAkB;gBAClC,eAAe,EAAE,UAAU,aAAa,CAAC,IAAI,CAAC,MAAM,EAAE,uBAAuB,EAAE,eAAe,CAAC,EAAE;gBACjG,GAAG,OAAO,CAAC,OAAO;aACnB;YACD,IAAI,EAAE,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC;YAC1B,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,MAAM,mBAAmB,CAAC,QAAQ,EAAE,iBAAiB,OAAO,CAAC,OAAO,EAAE,CAAC,CAAC;QAExE,MAAM,IAAI,GAAG,MAAM,QAAQ,CAAC,IAAI,EAA2B,CAAC;QAE5D,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,OAAO,CAAC,IAAI,CAAC,SAAS,EAAE;YACvD,MAAM,EAAE,OAAO,CAAC,WAAW;SAC5B,CAAC,CAAC;QAEH,IAAI,CAAC,aAAa,CAAC,EAAE,EAAE,CAAC;YACtB,MAAM,IAAI,QAAQ,CAAC,cAAc,aAAa,CAAC,MAAM,EAAE,EAAE;gBACvD,UAAU,EAAE,aAAa,CAAC,MAAM;gBAChC,KAAK,EAAE,iBAAiB,OAAO,CAAC,OAAO,EAAE;gBACzC,YAAY,EAAE,MAAM,aAAa,CAAC,IAAI,EAAE,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,SAAS,CAAC;aAChE,CAAC,CAAC;QACL,CAAC;QAED,MAAM,WAAW,GAAG,MAAM,aAAa,CAAC,WAAW,EAAE,CAAC;QAEtD,OAAO;YACL,KAAK,EAAE,IAAI,UAAU,CAAC,WAAW,CAAC;YAClC,SAAS,EAAE,YAAY;SACxB,CAAC;IACJ,CAAC;CACF;AAED,MAAM,UAAU,kBAAkB,CAAC,SAAqC,EAAE;IACxE,MAAM,QAAQ,GAAG,IAAI,oBAAoB,CAAC,MAAM,CAAC,CAAC;IAElD,OAAO,SAAS,YAAY,CAAC,OAAgB;QAC3C,OAAO;YACL,QAAQ;YACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;SAC1C,CAAC;IACJ,CAAC,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"resolve-provider.d.ts","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAkB,aAAa,EAAE,MAAM,sBAAsB,CAAC;AAuD1E,wBAAgB,YAAY,CAC1B,KAAK,EAAE,MAAM,GAAG,aAAa,GAC5B,aAAa,CAsBf"}
|
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
import { SpeechSDKError } from './errors.js';
|
|
2
|
+
import { OpenAISpeechProvider } from './providers/openai/index.js';
|
|
3
|
+
import { ElevenLabsSpeechProvider } from './providers/elevenlabs/index.js';
|
|
4
|
+
import { DeepgramSpeechProvider } from './providers/deepgram/index.js';
|
|
5
|
+
import { CartesiaSpeechProvider } from './providers/cartesia/index.js';
|
|
6
|
+
import { HumeSpeechProvider } from './providers/hume/index.js';
|
|
7
|
+
import { GoogleSpeechProvider } from './providers/google/index.js';
|
|
8
|
+
import { FishAudioSpeechProvider } from './providers/fish-audio/index.js';
|
|
9
|
+
import { UnrealSpeechProvider } from './providers/unreal-speech/index.js';
|
|
10
|
+
import { MurfSpeechProvider } from './providers/murf/index.js';
|
|
11
|
+
import { ResembleSpeechProvider } from './providers/resemble/index.js';
|
|
12
|
+
import { FalSpeechProvider } from './providers/fal/index.js';
|
|
13
|
+
import { MistralSpeechProvider } from './providers/mistral/index.js';
|
|
14
|
+
function isResolvedModel(model) {
|
|
15
|
+
return (model != null &&
|
|
16
|
+
typeof model === 'object' &&
|
|
17
|
+
'provider' in model &&
|
|
18
|
+
'modelId' in model);
|
|
19
|
+
}
|
|
20
|
+
function createBuiltinProvider(name) {
|
|
21
|
+
switch (name) {
|
|
22
|
+
case 'openai':
|
|
23
|
+
return new OpenAISpeechProvider({});
|
|
24
|
+
case 'elevenlabs':
|
|
25
|
+
return new ElevenLabsSpeechProvider({});
|
|
26
|
+
case 'deepgram':
|
|
27
|
+
return new DeepgramSpeechProvider({});
|
|
28
|
+
case 'cartesia':
|
|
29
|
+
return new CartesiaSpeechProvider({});
|
|
30
|
+
case 'hume':
|
|
31
|
+
return new HumeSpeechProvider({});
|
|
32
|
+
case 'google':
|
|
33
|
+
return new GoogleSpeechProvider({});
|
|
34
|
+
case 'fish-audio':
|
|
35
|
+
return new FishAudioSpeechProvider({});
|
|
36
|
+
case 'unreal-speech':
|
|
37
|
+
return new UnrealSpeechProvider({});
|
|
38
|
+
case 'murf':
|
|
39
|
+
return new MurfSpeechProvider({});
|
|
40
|
+
case 'resemble':
|
|
41
|
+
return new ResembleSpeechProvider({});
|
|
42
|
+
case 'fal-ai':
|
|
43
|
+
return new FalSpeechProvider({});
|
|
44
|
+
case 'mistral':
|
|
45
|
+
return new MistralSpeechProvider({});
|
|
46
|
+
default:
|
|
47
|
+
throw new SpeechSDKError(`Unknown provider: ${name}`);
|
|
48
|
+
}
|
|
49
|
+
}
|
|
50
|
+
export function resolveModel(model) {
|
|
51
|
+
if (isResolvedModel(model)) {
|
|
52
|
+
return model;
|
|
53
|
+
}
|
|
54
|
+
const slashIndex = model.indexOf('/');
|
|
55
|
+
let providerName;
|
|
56
|
+
let modelId;
|
|
57
|
+
if (slashIndex !== -1) {
|
|
58
|
+
providerName = model.slice(0, slashIndex);
|
|
59
|
+
modelId = model.slice(slashIndex + 1);
|
|
60
|
+
}
|
|
61
|
+
else {
|
|
62
|
+
providerName = model;
|
|
63
|
+
modelId = undefined;
|
|
64
|
+
}
|
|
65
|
+
const provider = createBuiltinProvider(providerName);
|
|
66
|
+
return {
|
|
67
|
+
provider,
|
|
68
|
+
modelId: modelId || provider.defaultModel,
|
|
69
|
+
};
|
|
70
|
+
}
|
|
71
|
+
//# sourceMappingURL=resolve-provider.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"resolve-provider.js","sourceRoot":"","sources":["../src/resolve-provider.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,cAAc,EAAE,MAAM,aAAa,CAAC;AAC7C,OAAO,EAAE,oBAAoB,EAAE,MAAM,6BAA6B,CAAC;AACnE,OAAO,EAAE,wBAAwB,EAAE,MAAM,iCAAiC,CAAC;AAC3E,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,oBAAoB,EAAE,MAAM,6BAA6B,CAAC;AACnE,OAAO,EAAE,uBAAuB,EAAE,MAAM,iCAAiC,CAAC;AAC1E,OAAO,EAAE,oBAAoB,EAAE,MAAM,oCAAoC,CAAC;AAC1E,OAAO,EAAE,kBAAkB,EAAE,MAAM,2BAA2B,CAAC;AAC/D,OAAO,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACvE,OAAO,EAAE,iBAAiB,EAAE,MAAM,0BAA0B,CAAC;AAC7D,OAAO,EAAE,qBAAqB,EAAE,MAAM,8BAA8B,CAAC;AAErE,SAAS,eAAe,CAAC,KAAc;IACrC,OAAO,CACL,KAAK,IAAI,IAAI;QACb,OAAO,KAAK,KAAK,QAAQ;QACzB,UAAU,IAAI,KAAK;QACnB,SAAS,IAAI,KAAK,CACnB,CAAC;AACJ,CAAC;AAED,SAAS,qBAAqB,CAAC,IAAY;IACzC,QAAQ,IAAI,EAAE,CAAC;QACb,KAAK,QAAQ;YACX,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QACtC,KAAK,YAAY;YACf,OAAO,IAAI,wBAAwB,CAAC,EAAE,CAAC,CAAC;QAC1C,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QACxC,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QAC5C,KAAK,MAAM;YACL,OAAO,IAAI,kBAAkB,CAAC,EAAE,CAAC,CAAC;QACpC,KAAK,QAAQ;YACX,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QAC1C,KAAK,YAAY;YACX,OAAO,IAAI,uBAAuB,CAAC,EAAE,CAAC,CAAC;QACzC,KAAK,eAAe;YAClB,OAAO,IAAI,oBAAoB,CAAC,EAAE,CAAC,CAAC;QACtC,KAAK,MAAM;YACT,OAAO,IAAI,kBAAkB,CAAC,EAAE,CAAC,CAAC;QACpC,KAAK,UAAU;YACb,OAAO,IAAI,sBAAsB,CAAC,EAAE,CAAC,CAAC;QAC5C,KAAK,QAAQ;YACP,OAAO,IAAI,iBAAiB,CAAC,EAAE,CAAC,CAAC;QACnC,KAAK,SAAS;YACZ,OAAO,IAAI,qBAAqB,CAAC,EAAE,CAAC,CAAC;QACvC;YACE,MAAM,IAAI,cAAc,CAAC,qBAAqB,IAAI,EAAE,CAAC,CAAC;IAC1D,CAAC;AACH,CAAC;AAED,MAAM,UAAU,YAAY,CAC1B,KAA6B;IAE7B,IAAI,eAAe,CAAC,KAAK,CAAC,EAAE,CAAC;QAC3B,OAAO,KAAK,CAAC;IACf,CAAC;IAED,MAAM,UAAU,GAAG,KAAK,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC;IACtC,IAAI,YAAoB,CAAC;IACzB,IAAI,OAA2B,CAAC;IAEhC,IAAI,UAAU,KAAK,CAAC,CAAC,EAAE,CAAC;QACtB,YAAY,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,EAAE,UAAU,CAAC,CAAC;QAC1C,OAAO,GAAG,KAAK,CAAC,KAAK,CAAC,UAAU,GAAG,CAAC,CAAC,CAAC;IACxC,CAAC;SAAM,CAAC;QACN,YAAY,GAAG,KAAK,CAAC;QACrB,OAAO,GAAG,SAAS,CAAC;IACtB,CAAC;IAED,MAAM,QAAQ,GAAG,qBAAqB,CAAC,YAAY,CAAC,CAAC;IACrD,OAAO;QACL,QAAQ;QACR,OAAO,EAAE,OAAO,IAAI,QAAQ,CAAC,YAAY;KAC1C,CAAC;AACJ,CAAC"}
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
export type Voice = string | {
|
|
2
|
+
url: string;
|
|
3
|
+
} | {
|
|
4
|
+
audio: string | Uint8Array;
|
|
5
|
+
};
|
|
6
|
+
export interface ModelInfo {
|
|
7
|
+
id: string;
|
|
8
|
+
languages: readonly string[];
|
|
9
|
+
}
|
|
10
|
+
export interface SpeechProvider<TModel extends string = string, TVoice extends Voice = Voice> {
|
|
11
|
+
id: string;
|
|
12
|
+
defaultModel: TModel;
|
|
13
|
+
models: readonly ModelInfo[];
|
|
14
|
+
generate(options: {
|
|
15
|
+
modelId: string;
|
|
16
|
+
text: string;
|
|
17
|
+
voice?: TVoice;
|
|
18
|
+
providerOptions?: Record<string, unknown>;
|
|
19
|
+
abortSignal?: AbortSignal;
|
|
20
|
+
headers?: Record<string, string>;
|
|
21
|
+
}): Promise<{
|
|
22
|
+
audio: string | Uint8Array;
|
|
23
|
+
mediaType: string;
|
|
24
|
+
providerMetadata?: Record<string, unknown>;
|
|
25
|
+
}>;
|
|
26
|
+
}
|
|
27
|
+
export interface ResolvedModel<TVoice extends Voice = Voice> {
|
|
28
|
+
provider: SpeechProvider<string, TVoice>;
|
|
29
|
+
modelId: string;
|
|
30
|
+
}
|
|
31
|
+
//# sourceMappingURL=speech-provider.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-provider.d.ts","sourceRoot":"","sources":["../src/speech-provider.ts"],"names":[],"mappings":"AAAA,MAAM,MAAM,KAAK,GACb,MAAM,GACN;IAAE,GAAG,EAAE,MAAM,CAAA;CAAE,GACf;IAAE,KAAK,EAAE,MAAM,GAAG,UAAU,CAAA;CAAE,CAAA;AAElC,MAAM,WAAW,SAAS;IACxB,EAAE,EAAE,MAAM,CAAC;IACX,SAAS,EAAE,SAAS,MAAM,EAAE,CAAC;CAC9B;AAED,MAAM,WAAW,cAAc,CAC7B,MAAM,SAAS,MAAM,GAAG,MAAM,EAC9B,MAAM,SAAS,KAAK,GAAG,KAAK;IAE5B,EAAE,EAAE,MAAM,CAAC;IACX,YAAY,EAAE,MAAM,CAAC;IACrB,MAAM,EAAE,SAAS,SAAS,EAAE,CAAC;IAE7B,QAAQ,CAAC,OAAO,EAAE;QAChB,OAAO,EAAE,MAAM,CAAC;QAChB,IAAI,EAAE,MAAM,CAAC;QACb,KAAK,CAAC,EAAE,MAAM,CAAC;QACf,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;QAC1C,WAAW,CAAC,EAAE,WAAW,CAAC;QAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;KAClC,GAAG,OAAO,CAAC;QACV,KAAK,EAAE,MAAM,GAAG,UAAU,CAAC;QAC3B,SAAS,EAAE,MAAM,CAAC;QAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;KAC5C,CAAC,CAAC;CACJ;AAED,MAAM,WAAW,aAAa,CAAC,MAAM,SAAS,KAAK,GAAG,KAAK;IACzD,QAAQ,EAAE,cAAc,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IACzC,OAAO,EAAE,MAAM,CAAC;CACjB"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-provider.js","sourceRoot":"","sources":["../src/speech-provider.ts"],"names":[],"mappings":""}
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
export interface GeneratedAudioFile {
|
|
2
|
+
readonly uint8Array: Uint8Array;
|
|
3
|
+
readonly base64: string;
|
|
4
|
+
readonly mediaType: string;
|
|
5
|
+
}
|
|
6
|
+
export interface SpeechResult {
|
|
7
|
+
readonly audio: GeneratedAudioFile;
|
|
8
|
+
readonly providerMetadata?: Record<string, unknown>;
|
|
9
|
+
}
|
|
10
|
+
export declare class DefaultGeneratedAudioFile implements GeneratedAudioFile {
|
|
11
|
+
readonly mediaType: string;
|
|
12
|
+
private _data;
|
|
13
|
+
private _uint8Array?;
|
|
14
|
+
private _base64?;
|
|
15
|
+
constructor({ data, mediaType }: {
|
|
16
|
+
data: string | Uint8Array;
|
|
17
|
+
mediaType: string;
|
|
18
|
+
});
|
|
19
|
+
get uint8Array(): Uint8Array;
|
|
20
|
+
get base64(): string;
|
|
21
|
+
}
|
|
22
|
+
//# sourceMappingURL=speech-result.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-result.d.ts","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"AAAA,MAAM,WAAW,kBAAkB;IACjC,QAAQ,CAAC,UAAU,EAAE,UAAU,CAAC;IAChC,QAAQ,CAAC,MAAM,EAAE,MAAM,CAAC;IACxB,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;CAC5B;AAED,MAAM,WAAW,YAAY;IAC3B,QAAQ,CAAC,KAAK,EAAE,kBAAkB,CAAC;IACnC,QAAQ,CAAC,gBAAgB,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;CACrD;AAED,qBAAa,yBAA0B,YAAW,kBAAkB;IAClE,QAAQ,CAAC,SAAS,EAAE,MAAM,CAAC;IAE3B,OAAO,CAAC,KAAK,CAAsB;IACnC,OAAO,CAAC,WAAW,CAAC,CAAa;IACjC,OAAO,CAAC,OAAO,CAAC,CAAS;gBAEb,EAAE,IAAI,EAAE,SAAS,EAAE,EAAE;QAAE,IAAI,EAAE,MAAM,GAAG,UAAU,CAAC;QAAC,SAAS,EAAE,MAAM,CAAA;KAAE;IAKjF,IAAI,UAAU,IAAI,UAAU,CAa3B;IAED,IAAI,MAAM,IAAI,MAAM,CAYnB;CACF"}
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
export class DefaultGeneratedAudioFile {
|
|
2
|
+
mediaType;
|
|
3
|
+
_data;
|
|
4
|
+
_uint8Array;
|
|
5
|
+
_base64;
|
|
6
|
+
constructor({ data, mediaType }) {
|
|
7
|
+
this._data = data;
|
|
8
|
+
this.mediaType = mediaType;
|
|
9
|
+
}
|
|
10
|
+
get uint8Array() {
|
|
11
|
+
if (this._uint8Array != null)
|
|
12
|
+
return this._uint8Array;
|
|
13
|
+
if (this._data instanceof Uint8Array) {
|
|
14
|
+
this._uint8Array = this._data;
|
|
15
|
+
}
|
|
16
|
+
else {
|
|
17
|
+
const binaryString = atob(this._data);
|
|
18
|
+
const bytes = new Uint8Array(binaryString.length);
|
|
19
|
+
for (let i = 0; i < binaryString.length; i++) {
|
|
20
|
+
bytes[i] = binaryString.charCodeAt(i);
|
|
21
|
+
}
|
|
22
|
+
this._uint8Array = bytes;
|
|
23
|
+
}
|
|
24
|
+
return this._uint8Array;
|
|
25
|
+
}
|
|
26
|
+
get base64() {
|
|
27
|
+
if (this._base64 != null)
|
|
28
|
+
return this._base64;
|
|
29
|
+
if (typeof this._data === 'string') {
|
|
30
|
+
this._base64 = this._data;
|
|
31
|
+
}
|
|
32
|
+
else {
|
|
33
|
+
let binaryString = '';
|
|
34
|
+
for (let i = 0; i < this._data.length; i++) {
|
|
35
|
+
binaryString += String.fromCharCode(this._data[i]);
|
|
36
|
+
}
|
|
37
|
+
this._base64 = btoa(binaryString);
|
|
38
|
+
}
|
|
39
|
+
return this._base64;
|
|
40
|
+
}
|
|
41
|
+
}
|
|
42
|
+
//# sourceMappingURL=speech-result.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"speech-result.js","sourceRoot":"","sources":["../src/speech-result.ts"],"names":[],"mappings":"AAWA,MAAM,OAAO,yBAAyB;IAC3B,SAAS,CAAS;IAEnB,KAAK,CAAsB;IAC3B,WAAW,CAAc;IACzB,OAAO,CAAU;IAEzB,YAAY,EAAE,IAAI,EAAE,SAAS,EAAoD;QAC/E,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC;QAClB,IAAI,CAAC,SAAS,GAAG,SAAS,CAAC;IAC7B,CAAC;IAED,IAAI,UAAU;QACZ,IAAI,IAAI,CAAC,WAAW,IAAI,IAAI;YAAE,OAAO,IAAI,CAAC,WAAW,CAAC;QACtD,IAAI,IAAI,CAAC,KAAK,YAAY,UAAU,EAAE,CAAC;YACrC,IAAI,CAAC,WAAW,GAAG,IAAI,CAAC,KAAK,CAAC;QAChC,CAAC;aAAM,CAAC;YACN,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YACtC,MAAM,KAAK,GAAG,IAAI,UAAU,CAAC,YAAY,CAAC,MAAM,CAAC,CAAC;YAClD,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,YAAY,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;gBAC7C,KAAK,CAAC,CAAC,CAAC,GAAG,YAAY,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;YACxC,CAAC;YACD,IAAI,CAAC,WAAW,GAAG,KAAK,CAAC;QAC3B,CAAC;QACD,OAAO,IAAI,CAAC,WAAW,CAAC;IAC1B,CAAC;IAED,IAAI,MAAM;QACR,IAAI,IAAI,CAAC,OAAO,IAAI,IAAI;YAAE,OAAO,IAAI,CAAC,OAAO,CAAC;QAC9C,IAAI,OAAO,IAAI,CAAC,KAAK,KAAK,QAAQ,EAAE,CAAC;YACnC,IAAI,CAAC,OAAO,GAAG,IAAI,CAAC,KAAK,CAAC;QAC5B,CAAC;aAAM,CAAC;YACN,IAAI,YAAY,GAAG,EAAE,CAAC;YACtB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;gBAC3C,YAAY,IAAI,MAAM,CAAC,YAAY,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC;YACrD,CAAC;YACD,IAAI,CAAC,OAAO,GAAG,IAAI,CAAC,YAAY,CAAC,CAAC;QACpC,CAAC;QACD,OAAO,IAAI,CAAC,OAAO,CAAC;IACtB,CAAC;CACF"}
|
package/dist/types.d.ts
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import type { ResolvedModel, Voice } from './speech-provider.js';
|
|
2
|
+
export type GenerateSpeechOptions<V extends Voice = Voice> = {
|
|
3
|
+
model: string | ResolvedModel<V>;
|
|
4
|
+
text: string;
|
|
5
|
+
voice: V;
|
|
6
|
+
providerOptions?: Record<string, unknown>;
|
|
7
|
+
maxRetries?: number;
|
|
8
|
+
abortSignal?: AbortSignal;
|
|
9
|
+
headers?: Record<string, string>;
|
|
10
|
+
};
|
|
11
|
+
//# sourceMappingURL=types.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.d.ts","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,aAAa,EAAE,KAAK,EAAE,MAAM,sBAAsB,CAAC;AAEjE,MAAM,MAAM,qBAAqB,CAAC,CAAC,SAAS,KAAK,GAAG,KAAK,IAAI;IAC3D,KAAK,EAAE,MAAM,GAAG,aAAa,CAAC,CAAC,CAAC,CAAC;IACjC,IAAI,EAAE,MAAM,CAAC;IACb,KAAK,EAAE,CAAC,CAAC;IACT,eAAe,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,OAAO,CAAC,CAAC;IAC1C,UAAU,CAAC,EAAE,MAAM,CAAC;IACpB,WAAW,CAAC,EAAE,WAAW,CAAC;IAC1B,OAAO,CAAC,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;CAClC,CAAC"}
|
package/dist/types.js
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"types.js","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":""}
|
package/package.json
ADDED
|
@@ -0,0 +1,96 @@
|
|
|
1
|
+
{
|
|
2
|
+
"name": "@speech-sdk/core",
|
|
3
|
+
"version": "0.0.1",
|
|
4
|
+
"description": "Universal, cross-platform text-to-speech SDK with multi-provider support.",
|
|
5
|
+
"type": "module",
|
|
6
|
+
"packageManager": "pnpm@10.11.1",
|
|
7
|
+
"main": "./dist/index.js",
|
|
8
|
+
"types": "./dist/index.d.ts",
|
|
9
|
+
"exports": {
|
|
10
|
+
".": {
|
|
11
|
+
"types": "./dist/index.d.ts",
|
|
12
|
+
"default": "./dist/index.js"
|
|
13
|
+
},
|
|
14
|
+
"./openai": {
|
|
15
|
+
"types": "./dist/providers/openai/index.d.ts",
|
|
16
|
+
"default": "./dist/providers/openai/index.js"
|
|
17
|
+
},
|
|
18
|
+
"./elevenlabs": {
|
|
19
|
+
"types": "./dist/providers/elevenlabs/index.d.ts",
|
|
20
|
+
"default": "./dist/providers/elevenlabs/index.js"
|
|
21
|
+
},
|
|
22
|
+
"./deepgram": {
|
|
23
|
+
"types": "./dist/providers/deepgram/index.d.ts",
|
|
24
|
+
"default": "./dist/providers/deepgram/index.js"
|
|
25
|
+
},
|
|
26
|
+
"./cartesia": {
|
|
27
|
+
"types": "./dist/providers/cartesia/index.d.ts",
|
|
28
|
+
"default": "./dist/providers/cartesia/index.js"
|
|
29
|
+
},
|
|
30
|
+
"./hume": {
|
|
31
|
+
"types": "./dist/providers/hume/index.d.ts",
|
|
32
|
+
"default": "./dist/providers/hume/index.js"
|
|
33
|
+
},
|
|
34
|
+
"./google": {
|
|
35
|
+
"types": "./dist/providers/google/index.d.ts",
|
|
36
|
+
"default": "./dist/providers/google/index.js"
|
|
37
|
+
},
|
|
38
|
+
"./fish-audio": {
|
|
39
|
+
"types": "./dist/providers/fish-audio/index.d.ts",
|
|
40
|
+
"default": "./dist/providers/fish-audio/index.js"
|
|
41
|
+
},
|
|
42
|
+
"./unreal-speech": {
|
|
43
|
+
"types": "./dist/providers/unreal-speech/index.d.ts",
|
|
44
|
+
"default": "./dist/providers/unreal-speech/index.js"
|
|
45
|
+
},
|
|
46
|
+
"./murf": {
|
|
47
|
+
"types": "./dist/providers/murf/index.d.ts",
|
|
48
|
+
"default": "./dist/providers/murf/index.js"
|
|
49
|
+
},
|
|
50
|
+
"./resemble": {
|
|
51
|
+
"types": "./dist/providers/resemble/index.d.ts",
|
|
52
|
+
"default": "./dist/providers/resemble/index.js"
|
|
53
|
+
},
|
|
54
|
+
"./fal-ai": {
|
|
55
|
+
"types": "./dist/providers/fal/index.d.ts",
|
|
56
|
+
"default": "./dist/providers/fal/index.js"
|
|
57
|
+
},
|
|
58
|
+
"./mistral": {
|
|
59
|
+
"types": "./dist/providers/mistral/index.d.ts",
|
|
60
|
+
"default": "./dist/providers/mistral/index.js"
|
|
61
|
+
}
|
|
62
|
+
},
|
|
63
|
+
"files": [
|
|
64
|
+
"dist",
|
|
65
|
+
"README.md"
|
|
66
|
+
],
|
|
67
|
+
"scripts": {
|
|
68
|
+
"build": "tsc",
|
|
69
|
+
"test": "vitest run",
|
|
70
|
+
"test:watch": "vitest",
|
|
71
|
+
"test:e2e": "vitest run --config vitest.config.e2e.ts",
|
|
72
|
+
"typecheck": "tsc --noEmit"
|
|
73
|
+
},
|
|
74
|
+
"keywords": [
|
|
75
|
+
"tts",
|
|
76
|
+
"text-to-speech",
|
|
77
|
+
"speech",
|
|
78
|
+
"openai",
|
|
79
|
+
"elevenlabs",
|
|
80
|
+
"ai"
|
|
81
|
+
],
|
|
82
|
+
"license": "MIT",
|
|
83
|
+
"repository": {
|
|
84
|
+
"type": "git",
|
|
85
|
+
"url": "https://github.com/Jellypod-Inc/speech-sdk"
|
|
86
|
+
},
|
|
87
|
+
"dependencies": {
|
|
88
|
+
"p-retry": "^8.0.0"
|
|
89
|
+
},
|
|
90
|
+
"devDependencies": {
|
|
91
|
+
"@types/node": "^25.5.0",
|
|
92
|
+
"dotenv": "^17.3.1",
|
|
93
|
+
"typescript": "^5.8.0",
|
|
94
|
+
"vitest": "^3.1.0"
|
|
95
|
+
}
|
|
96
|
+
}
|