@livekit/agents-plugin-openai 0.6.1 → 0.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +18 -0
- package/dist/index.cjs +55 -0
- package/dist/index.cjs.map +1 -0
- package/dist/index.js +13 -8
- package/dist/index.js.map +1 -1
- package/dist/llm.cjs +502 -0
- package/dist/llm.cjs.map +1 -0
- package/dist/llm.js +435 -424
- package/dist/llm.js.map +1 -1
- package/dist/models.cjs +17 -0
- package/dist/models.cjs.map +1 -0
- package/dist/models.js +0 -4
- package/dist/models.js.map +1 -1
- package/dist/realtime/api_proto.cjs +41 -0
- package/dist/realtime/api_proto.cjs.map +1 -0
- package/dist/realtime/api_proto.js +12 -8
- package/dist/realtime/api_proto.js.map +1 -1
- package/dist/realtime/index.cjs +25 -0
- package/dist/realtime/index.cjs.map +1 -0
- package/dist/realtime/index.js +2 -5
- package/dist/realtime/index.js.map +1 -1
- package/dist/realtime/realtime_model.cjs +878 -0
- package/dist/realtime/realtime_model.cjs.map +1 -0
- package/dist/realtime/realtime_model.js +828 -777
- package/dist/realtime/realtime_model.js.map +1 -1
- package/dist/stt.cjs +130 -0
- package/dist/stt.cjs.map +1 -0
- package/dist/stt.js +99 -102
- package/dist/stt.js.map +1 -1
- package/dist/tts.cjs +100 -0
- package/dist/tts.cjs.map +1 -0
- package/dist/tts.d.ts +1 -1
- package/dist/tts.d.ts.map +1 -1
- package/dist/tts.js +67 -65
- package/dist/tts.js.map +1 -1
- package/package.json +18 -8
- package/src/tts.ts +2 -1
package/dist/tts.cjs
ADDED
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
var __defProp = Object.defineProperty;
|
|
3
|
+
var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
|
|
4
|
+
var __getOwnPropNames = Object.getOwnPropertyNames;
|
|
5
|
+
var __hasOwnProp = Object.prototype.hasOwnProperty;
|
|
6
|
+
var __export = (target, all) => {
|
|
7
|
+
for (var name in all)
|
|
8
|
+
__defProp(target, name, { get: all[name], enumerable: true });
|
|
9
|
+
};
|
|
10
|
+
var __copyProps = (to, from, except, desc) => {
|
|
11
|
+
if (from && typeof from === "object" || typeof from === "function") {
|
|
12
|
+
for (let key of __getOwnPropNames(from))
|
|
13
|
+
if (!__hasOwnProp.call(to, key) && key !== except)
|
|
14
|
+
__defProp(to, key, { get: () => from[key], enumerable: !(desc = __getOwnPropDesc(from, key)) || desc.enumerable });
|
|
15
|
+
}
|
|
16
|
+
return to;
|
|
17
|
+
};
|
|
18
|
+
var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
|
|
19
|
+
var tts_exports = {};
|
|
20
|
+
__export(tts_exports, {
|
|
21
|
+
ChunkedStream: () => ChunkedStream,
|
|
22
|
+
TTS: () => TTS
|
|
23
|
+
});
|
|
24
|
+
module.exports = __toCommonJS(tts_exports);
|
|
25
|
+
var import_agents = require("@livekit/agents");
|
|
26
|
+
var import_openai = require("openai");
|
|
27
|
+
const OPENAI_TTS_SAMPLE_RATE = 24e3;
|
|
28
|
+
const OPENAI_TTS_CHANNELS = 1;
|
|
29
|
+
const defaultTTSOptions = {
|
|
30
|
+
apiKey: process.env.OPENAI_API_KEY,
|
|
31
|
+
model: "tts-1",
|
|
32
|
+
voice: "alloy",
|
|
33
|
+
speed: 1
|
|
34
|
+
};
|
|
35
|
+
class TTS extends import_agents.tts.TTS {
|
|
36
|
+
#opts;
|
|
37
|
+
#client;
|
|
38
|
+
/**
|
|
39
|
+
* Create a new instance of OpenAI TTS.
|
|
40
|
+
*
|
|
41
|
+
* @remarks
|
|
42
|
+
* `apiKey` must be set to your OpenAI API key, either using the argument or by setting the
|
|
43
|
+
* `OPENAI_API_KEY` environmental variable.
|
|
44
|
+
*/
|
|
45
|
+
constructor(opts = defaultTTSOptions) {
|
|
46
|
+
super(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS, { streaming: false });
|
|
47
|
+
this.#opts = { ...defaultTTSOptions, ...opts };
|
|
48
|
+
if (this.#opts.apiKey === void 0) {
|
|
49
|
+
throw new Error("OpenAI API key is required, whether as an argument or as $OPENAI_API_KEY");
|
|
50
|
+
}
|
|
51
|
+
this.#client = this.#opts.client || new import_openai.OpenAI({
|
|
52
|
+
baseURL: opts.baseURL,
|
|
53
|
+
apiKey: opts.apiKey
|
|
54
|
+
});
|
|
55
|
+
}
|
|
56
|
+
updateOptions(opts) {
|
|
57
|
+
this.#opts = { ...this.#opts, ...opts };
|
|
58
|
+
}
|
|
59
|
+
synthesize(text) {
|
|
60
|
+
return new ChunkedStream(
|
|
61
|
+
this.#client.audio.speech.create({
|
|
62
|
+
input: text,
|
|
63
|
+
model: this.#opts.model,
|
|
64
|
+
voice: this.#opts.voice,
|
|
65
|
+
response_format: "pcm",
|
|
66
|
+
speed: this.#opts.speed
|
|
67
|
+
})
|
|
68
|
+
);
|
|
69
|
+
}
|
|
70
|
+
stream() {
|
|
71
|
+
throw new Error("Streaming is not supported on OpenAI TTS");
|
|
72
|
+
}
|
|
73
|
+
}
|
|
74
|
+
class ChunkedStream extends import_agents.tts.ChunkedStream {
|
|
75
|
+
// set Promise<T> to any because OpenAI returns an annoying Response type
|
|
76
|
+
constructor(stream) {
|
|
77
|
+
super();
|
|
78
|
+
this.#run(stream);
|
|
79
|
+
}
|
|
80
|
+
async #run(stream) {
|
|
81
|
+
const buffer = await stream.then((r) => r.arrayBuffer());
|
|
82
|
+
const requestId = crypto.randomUUID();
|
|
83
|
+
const audioByteStream = new import_agents.AudioByteStream(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS);
|
|
84
|
+
const frames = audioByteStream.write(buffer);
|
|
85
|
+
for (const frame of frames) {
|
|
86
|
+
this.queue.put({
|
|
87
|
+
frame,
|
|
88
|
+
requestId,
|
|
89
|
+
segmentId: requestId
|
|
90
|
+
});
|
|
91
|
+
}
|
|
92
|
+
this.queue.close();
|
|
93
|
+
}
|
|
94
|
+
}
|
|
95
|
+
// Annotate the CommonJS export names for ESM import in node:
|
|
96
|
+
0 && (module.exports = {
|
|
97
|
+
ChunkedStream,
|
|
98
|
+
TTS
|
|
99
|
+
});
|
|
100
|
+
//# sourceMappingURL=tts.cjs.map
|
package/dist/tts.cjs.map
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"sources":["../src/tts.ts"],"sourcesContent":["// SPDX-FileCopyrightText: 2024 LiveKit, Inc.\n//\n// SPDX-License-Identifier: Apache-2.0\nimport { AudioByteStream, tts } from '@livekit/agents';\nimport { OpenAI } from 'openai';\nimport type { TTSModels, TTSVoices } from './models.js';\n\nconst OPENAI_TTS_SAMPLE_RATE = 24000;\nconst OPENAI_TTS_CHANNELS = 1;\n\nexport interface TTSOptions {\n model: TTSModels | string;\n voice: TTSVoices;\n speed: number;\n baseURL?: string;\n client?: OpenAI;\n apiKey?: string;\n}\n\nconst defaultTTSOptions: TTSOptions = {\n apiKey: process.env.OPENAI_API_KEY,\n model: 'tts-1',\n voice: 'alloy',\n speed: 1,\n};\n\nexport class TTS extends tts.TTS {\n #opts: TTSOptions;\n #client: OpenAI;\n\n /**\n * Create a new instance of OpenAI TTS.\n *\n * @remarks\n * `apiKey` must be set to your OpenAI API key, either using the argument or by setting the\n * `OPENAI_API_KEY` environmental variable.\n */\n constructor(opts: Partial<TTSOptions> = defaultTTSOptions) {\n super(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS, { streaming: false });\n\n this.#opts = { ...defaultTTSOptions, ...opts };\n if (this.#opts.apiKey === undefined) {\n throw new Error('OpenAI API key is required, whether as an argument or as $OPENAI_API_KEY');\n }\n\n this.#client =\n this.#opts.client ||\n new OpenAI({\n baseURL: opts.baseURL,\n apiKey: opts.apiKey,\n });\n }\n\n updateOptions(opts: { model?: TTSModels | string; voice?: TTSVoices; speed?: number }) {\n this.#opts = { ...this.#opts, ...opts };\n }\n\n synthesize(text: string): ChunkedStream {\n return new ChunkedStream(\n this.#client.audio.speech.create({\n input: text,\n model: this.#opts.model,\n voice: this.#opts.voice,\n response_format: 'pcm',\n speed: this.#opts.speed,\n }),\n );\n }\n\n stream(): tts.SynthesizeStream {\n throw new Error('Streaming is not supported on OpenAI TTS');\n }\n}\n\nexport class ChunkedStream extends tts.ChunkedStream {\n // set Promise<T> to any because OpenAI returns an annoying Response type\n constructor(stream: Promise<any>) {\n super();\n this.#run(stream);\n }\n\n async #run(stream: Promise<Response>) {\n const buffer = await stream.then((r) => r.arrayBuffer());\n const requestId = crypto.randomUUID();\n const audioByteStream = new AudioByteStream(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS);\n const frames = audioByteStream.write(buffer);\n\n for (const frame of frames) {\n this.queue.put({\n frame,\n requestId,\n segmentId: requestId,\n });\n }\n this.queue.close();\n }\n}\n"],"mappings":";;;;;;;;;;;;;;;;;;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAGA,oBAAqC;AACrC,oBAAuB;AAGvB,MAAM,yBAAyB;AAC/B,MAAM,sBAAsB;AAW5B,MAAM,oBAAgC;AAAA,EACpC,QAAQ,QAAQ,IAAI;AAAA,EACpB,OAAO;AAAA,EACP,OAAO;AAAA,EACP,OAAO;AACT;AAEO,MAAM,YAAY,kBAAI,IAAI;AAAA,EAC/B;AAAA,EACA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,EASA,YAAY,OAA4B,mBAAmB;AACzD,UAAM,wBAAwB,qBAAqB,EAAE,WAAW,MAAM,CAAC;AAEvE,SAAK,QAAQ,EAAE,GAAG,mBAAmB,GAAG,KAAK;AAC7C,QAAI,KAAK,MAAM,WAAW,QAAW;AACnC,YAAM,IAAI,MAAM,0EAA0E;AAAA,IAC5F;AAEA,SAAK,UACH,KAAK,MAAM,UACX,IAAI,qBAAO;AAAA,MACT,SAAS,KAAK;AAAA,MACd,QAAQ,KAAK;AAAA,IACf,CAAC;AAAA,EACL;AAAA,EAEA,cAAc,MAAyE;AACrF,SAAK,QAAQ,EAAE,GAAG,KAAK,OAAO,GAAG,KAAK;AAAA,EACxC;AAAA,EAEA,WAAW,MAA6B;AACtC,WAAO,IAAI;AAAA,MACT,KAAK,QAAQ,MAAM,OAAO,OAAO;AAAA,QAC/B,OAAO;AAAA,QACP,OAAO,KAAK,MAAM;AAAA,QAClB,OAAO,KAAK,MAAM;AAAA,QAClB,iBAAiB;AAAA,QACjB,OAAO,KAAK,MAAM;AAAA,MACpB,CAAC;AAAA,IACH;AAAA,EACF;AAAA,EAEA,SAA+B;AAC7B,UAAM,IAAI,MAAM,0CAA0C;AAAA,EAC5D;AACF;AAEO,MAAM,sBAAsB,kBAAI,cAAc;AAAA;AAAA,EAEnD,YAAY,QAAsB;AAChC,UAAM;AACN,SAAK,KAAK,MAAM;AAAA,EAClB;AAAA,EAEA,MAAM,KAAK,QAA2B;AACpC,UAAM,SAAS,MAAM,OAAO,KAAK,CAAC,MAAM,EAAE,YAAY,CAAC;AACvD,UAAM,YAAY,OAAO,WAAW;AACpC,UAAM,kBAAkB,IAAI,8BAAgB,wBAAwB,mBAAmB;AACvF,UAAM,SAAS,gBAAgB,MAAM,MAAM;AAE3C,eAAW,SAAS,QAAQ;AAC1B,WAAK,MAAM,IAAI;AAAA,QACb;AAAA,QACA;AAAA,QACA,WAAW;AAAA,MACb,CAAC;AAAA,IACH;AACA,SAAK,MAAM,MAAM;AAAA,EACnB;AACF;","names":[]}
|
package/dist/tts.d.ts
CHANGED
package/dist/tts.d.ts.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"tts.d.ts","sourceRoot":"","sources":["../src/tts.ts"],"names":[],"mappings":"AAGA,OAAO,EAAmB,GAAG,EAAE,MAAM,iBAAiB,CAAC;AACvD,OAAO,EAAE,MAAM,EAAE,MAAM,QAAQ,CAAC;AAChC,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAKxD,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,SAAS,GAAG,MAAM,CAAC;IAC1B,KAAK,EAAE,SAAS,CAAC;IACjB,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AASD,qBAAa,GAAI,SAAQ,GAAG,CAAC,GAAG;;IAI9B;;;;;;OAMG;gBACS,IAAI,GAAE,OAAO,CAAC,UAAU,CAAqB;IAgBzD,aAAa,CAAC,IAAI,EAAE;QAAE,KAAK,CAAC,EAAE,SAAS,GAAG,MAAM,CAAC;QAAC,KAAK,CAAC,EAAE,SAAS,CAAC;QAAC,KAAK,CAAC,EAAE,MAAM,CAAA;KAAE;IAIrF,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,aAAa;IAYvC,MAAM,IAAI,GAAG,CAAC,gBAAgB;CAG/B;AAED,qBAAa,aAAc,SAAQ,GAAG,CAAC,aAAa;;
|
|
1
|
+
{"version":3,"file":"tts.d.ts","sourceRoot":"","sources":["../src/tts.ts"],"names":[],"mappings":"AAGA,OAAO,EAAmB,GAAG,EAAE,MAAM,iBAAiB,CAAC;AACvD,OAAO,EAAE,MAAM,EAAE,MAAM,QAAQ,CAAC;AAChC,OAAO,KAAK,EAAE,SAAS,EAAE,SAAS,EAAE,MAAM,aAAa,CAAC;AAKxD,MAAM,WAAW,UAAU;IACzB,KAAK,EAAE,SAAS,GAAG,MAAM,CAAC;IAC1B,KAAK,EAAE,SAAS,CAAC;IACjB,KAAK,EAAE,MAAM,CAAC;IACd,OAAO,CAAC,EAAE,MAAM,CAAC;IACjB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,MAAM,CAAC,EAAE,MAAM,CAAC;CACjB;AASD,qBAAa,GAAI,SAAQ,GAAG,CAAC,GAAG;;IAI9B;;;;;;OAMG;gBACS,IAAI,GAAE,OAAO,CAAC,UAAU,CAAqB;IAgBzD,aAAa,CAAC,IAAI,EAAE;QAAE,KAAK,CAAC,EAAE,SAAS,GAAG,MAAM,CAAC;QAAC,KAAK,CAAC,EAAE,SAAS,CAAC;QAAC,KAAK,CAAC,EAAE,MAAM,CAAA;KAAE;IAIrF,UAAU,CAAC,IAAI,EAAE,MAAM,GAAG,aAAa;IAYvC,MAAM,IAAI,GAAG,CAAC,gBAAgB;CAG/B;AAED,qBAAa,aAAc,SAAQ,GAAG,CAAC,aAAa;;gBAEtC,MAAM,EAAE,OAAO,CAAC,GAAG,CAAC;CAoBjC"}
|
package/dist/tts.js
CHANGED
|
@@ -1,73 +1,75 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
import { AudioByteStream, tts } from '@livekit/agents';
|
|
5
|
-
import { OpenAI } from 'openai';
|
|
6
|
-
const OPENAI_TTS_SAMPLE_RATE = 24000;
|
|
1
|
+
import { AudioByteStream, tts } from "@livekit/agents";
|
|
2
|
+
import { OpenAI } from "openai";
|
|
3
|
+
const OPENAI_TTS_SAMPLE_RATE = 24e3;
|
|
7
4
|
const OPENAI_TTS_CHANNELS = 1;
|
|
8
5
|
const defaultTTSOptions = {
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
6
|
+
apiKey: process.env.OPENAI_API_KEY,
|
|
7
|
+
model: "tts-1",
|
|
8
|
+
voice: "alloy",
|
|
9
|
+
speed: 1
|
|
13
10
|
};
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
}
|
|
30
|
-
this.#client =
|
|
31
|
-
this.#opts.client ||
|
|
32
|
-
new OpenAI({
|
|
33
|
-
baseURL: opts.baseURL,
|
|
34
|
-
apiKey: opts.apiKey,
|
|
35
|
-
});
|
|
36
|
-
}
|
|
37
|
-
updateOptions(opts) {
|
|
38
|
-
this.#opts = { ...this.#opts, ...opts };
|
|
39
|
-
}
|
|
40
|
-
synthesize(text) {
|
|
41
|
-
return new ChunkedStream(this.#client.audio.speech.create({
|
|
42
|
-
input: text,
|
|
43
|
-
model: this.#opts.model,
|
|
44
|
-
voice: this.#opts.voice,
|
|
45
|
-
response_format: 'pcm',
|
|
46
|
-
speed: this.#opts.speed,
|
|
47
|
-
}));
|
|
48
|
-
}
|
|
49
|
-
stream() {
|
|
50
|
-
throw new Error('Streaming is not supported on OpenAI TTS');
|
|
11
|
+
class TTS extends tts.TTS {
|
|
12
|
+
#opts;
|
|
13
|
+
#client;
|
|
14
|
+
/**
|
|
15
|
+
* Create a new instance of OpenAI TTS.
|
|
16
|
+
*
|
|
17
|
+
* @remarks
|
|
18
|
+
* `apiKey` must be set to your OpenAI API key, either using the argument or by setting the
|
|
19
|
+
* `OPENAI_API_KEY` environmental variable.
|
|
20
|
+
*/
|
|
21
|
+
constructor(opts = defaultTTSOptions) {
|
|
22
|
+
super(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS, { streaming: false });
|
|
23
|
+
this.#opts = { ...defaultTTSOptions, ...opts };
|
|
24
|
+
if (this.#opts.apiKey === void 0) {
|
|
25
|
+
throw new Error("OpenAI API key is required, whether as an argument or as $OPENAI_API_KEY");
|
|
51
26
|
}
|
|
27
|
+
this.#client = this.#opts.client || new OpenAI({
|
|
28
|
+
baseURL: opts.baseURL,
|
|
29
|
+
apiKey: opts.apiKey
|
|
30
|
+
});
|
|
31
|
+
}
|
|
32
|
+
updateOptions(opts) {
|
|
33
|
+
this.#opts = { ...this.#opts, ...opts };
|
|
34
|
+
}
|
|
35
|
+
synthesize(text) {
|
|
36
|
+
return new ChunkedStream(
|
|
37
|
+
this.#client.audio.speech.create({
|
|
38
|
+
input: text,
|
|
39
|
+
model: this.#opts.model,
|
|
40
|
+
voice: this.#opts.voice,
|
|
41
|
+
response_format: "pcm",
|
|
42
|
+
speed: this.#opts.speed
|
|
43
|
+
})
|
|
44
|
+
);
|
|
45
|
+
}
|
|
46
|
+
stream() {
|
|
47
|
+
throw new Error("Streaming is not supported on OpenAI TTS");
|
|
48
|
+
}
|
|
52
49
|
}
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
this.queue.close();
|
|
50
|
+
class ChunkedStream extends tts.ChunkedStream {
|
|
51
|
+
// set Promise<T> to any because OpenAI returns an annoying Response type
|
|
52
|
+
constructor(stream) {
|
|
53
|
+
super();
|
|
54
|
+
this.#run(stream);
|
|
55
|
+
}
|
|
56
|
+
async #run(stream) {
|
|
57
|
+
const buffer = await stream.then((r) => r.arrayBuffer());
|
|
58
|
+
const requestId = crypto.randomUUID();
|
|
59
|
+
const audioByteStream = new AudioByteStream(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS);
|
|
60
|
+
const frames = audioByteStream.write(buffer);
|
|
61
|
+
for (const frame of frames) {
|
|
62
|
+
this.queue.put({
|
|
63
|
+
frame,
|
|
64
|
+
requestId,
|
|
65
|
+
segmentId: requestId
|
|
66
|
+
});
|
|
71
67
|
}
|
|
68
|
+
this.queue.close();
|
|
69
|
+
}
|
|
72
70
|
}
|
|
71
|
+
export {
|
|
72
|
+
ChunkedStream,
|
|
73
|
+
TTS
|
|
74
|
+
};
|
|
73
75
|
//# sourceMappingURL=tts.js.map
|
package/dist/tts.js.map
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"
|
|
1
|
+
{"version":3,"sources":["../src/tts.ts"],"sourcesContent":["// SPDX-FileCopyrightText: 2024 LiveKit, Inc.\n//\n// SPDX-License-Identifier: Apache-2.0\nimport { AudioByteStream, tts } from '@livekit/agents';\nimport { OpenAI } from 'openai';\nimport type { TTSModels, TTSVoices } from './models.js';\n\nconst OPENAI_TTS_SAMPLE_RATE = 24000;\nconst OPENAI_TTS_CHANNELS = 1;\n\nexport interface TTSOptions {\n model: TTSModels | string;\n voice: TTSVoices;\n speed: number;\n baseURL?: string;\n client?: OpenAI;\n apiKey?: string;\n}\n\nconst defaultTTSOptions: TTSOptions = {\n apiKey: process.env.OPENAI_API_KEY,\n model: 'tts-1',\n voice: 'alloy',\n speed: 1,\n};\n\nexport class TTS extends tts.TTS {\n #opts: TTSOptions;\n #client: OpenAI;\n\n /**\n * Create a new instance of OpenAI TTS.\n *\n * @remarks\n * `apiKey` must be set to your OpenAI API key, either using the argument or by setting the\n * `OPENAI_API_KEY` environmental variable.\n */\n constructor(opts: Partial<TTSOptions> = defaultTTSOptions) {\n super(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS, { streaming: false });\n\n this.#opts = { ...defaultTTSOptions, ...opts };\n if (this.#opts.apiKey === undefined) {\n throw new Error('OpenAI API key is required, whether as an argument or as $OPENAI_API_KEY');\n }\n\n this.#client =\n this.#opts.client ||\n new OpenAI({\n baseURL: opts.baseURL,\n apiKey: opts.apiKey,\n });\n }\n\n updateOptions(opts: { model?: TTSModels | string; voice?: TTSVoices; speed?: number }) {\n this.#opts = { ...this.#opts, ...opts };\n }\n\n synthesize(text: string): ChunkedStream {\n return new ChunkedStream(\n this.#client.audio.speech.create({\n input: text,\n model: this.#opts.model,\n voice: this.#opts.voice,\n response_format: 'pcm',\n speed: this.#opts.speed,\n }),\n );\n }\n\n stream(): tts.SynthesizeStream {\n throw new Error('Streaming is not supported on OpenAI TTS');\n }\n}\n\nexport class ChunkedStream extends tts.ChunkedStream {\n // set Promise<T> to any because OpenAI returns an annoying Response type\n constructor(stream: Promise<any>) {\n super();\n this.#run(stream);\n }\n\n async #run(stream: Promise<Response>) {\n const buffer = await stream.then((r) => r.arrayBuffer());\n const requestId = crypto.randomUUID();\n const audioByteStream = new AudioByteStream(OPENAI_TTS_SAMPLE_RATE, OPENAI_TTS_CHANNELS);\n const frames = audioByteStream.write(buffer);\n\n for (const frame of frames) {\n this.queue.put({\n frame,\n requestId,\n segmentId: requestId,\n });\n }\n this.queue.close();\n }\n}\n"],"mappings":"AAGA,SAAS,iBAAiB,WAAW;AACrC,SAAS,cAAc;AAGvB,MAAM,yBAAyB;AAC/B,MAAM,sBAAsB;AAW5B,MAAM,oBAAgC;AAAA,EACpC,QAAQ,QAAQ,IAAI;AAAA,EACpB,OAAO;AAAA,EACP,OAAO;AAAA,EACP,OAAO;AACT;AAEO,MAAM,YAAY,IAAI,IAAI;AAAA,EAC/B;AAAA,EACA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA;AAAA,EASA,YAAY,OAA4B,mBAAmB;AACzD,UAAM,wBAAwB,qBAAqB,EAAE,WAAW,MAAM,CAAC;AAEvE,SAAK,QAAQ,EAAE,GAAG,mBAAmB,GAAG,KAAK;AAC7C,QAAI,KAAK,MAAM,WAAW,QAAW;AACnC,YAAM,IAAI,MAAM,0EAA0E;AAAA,IAC5F;AAEA,SAAK,UACH,KAAK,MAAM,UACX,IAAI,OAAO;AAAA,MACT,SAAS,KAAK;AAAA,MACd,QAAQ,KAAK;AAAA,IACf,CAAC;AAAA,EACL;AAAA,EAEA,cAAc,MAAyE;AACrF,SAAK,QAAQ,EAAE,GAAG,KAAK,OAAO,GAAG,KAAK;AAAA,EACxC;AAAA,EAEA,WAAW,MAA6B;AACtC,WAAO,IAAI;AAAA,MACT,KAAK,QAAQ,MAAM,OAAO,OAAO;AAAA,QAC/B,OAAO;AAAA,QACP,OAAO,KAAK,MAAM;AAAA,QAClB,OAAO,KAAK,MAAM;AAAA,QAClB,iBAAiB;AAAA,QACjB,OAAO,KAAK,MAAM;AAAA,MACpB,CAAC;AAAA,IACH;AAAA,EACF;AAAA,EAEA,SAA+B;AAC7B,UAAM,IAAI,MAAM,0CAA0C;AAAA,EAC5D;AACF;AAEO,MAAM,sBAAsB,IAAI,cAAc;AAAA;AAAA,EAEnD,YAAY,QAAsB;AAChC,UAAM;AACN,SAAK,KAAK,MAAM;AAAA,EAClB;AAAA,EAEA,MAAM,KAAK,QAA2B;AACpC,UAAM,SAAS,MAAM,OAAO,KAAK,CAAC,MAAM,EAAE,YAAY,CAAC;AACvD,UAAM,YAAY,OAAO,WAAW;AACpC,UAAM,kBAAkB,IAAI,gBAAgB,wBAAwB,mBAAmB;AACvF,UAAM,SAAS,gBAAgB,MAAM,MAAM;AAE3C,eAAW,SAAS,QAAQ;AAC1B,WAAK,MAAM,IAAI;AAAA,QACb;AAAA,QACA;AAAA,QACA,WAAW;AAAA,MACb,CAAC;AAAA,IACH;AACA,SAAK,MAAM,MAAM;AAAA,EACnB;AACF;","names":[]}
|
package/package.json
CHANGED
|
@@ -1,23 +1,33 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@livekit/agents-plugin-openai",
|
|
3
|
-
"version": "0.
|
|
3
|
+
"version": "0.7.0",
|
|
4
4
|
"description": "OpenAI plugin for LiveKit Node Agents",
|
|
5
5
|
"main": "dist/index.js",
|
|
6
|
+
"require": "dist/index.cjs",
|
|
6
7
|
"types": "dist/index.d.ts",
|
|
8
|
+
"exports": {
|
|
9
|
+
".": {
|
|
10
|
+
"types": "./dist/index.d.ts",
|
|
11
|
+
"import": "./dist/index.js",
|
|
12
|
+
"require": "./dist/index.cjs"
|
|
13
|
+
}
|
|
14
|
+
},
|
|
7
15
|
"author": "LiveKit",
|
|
8
16
|
"type": "module",
|
|
9
17
|
"repository": "git@github.com:livekit/agents-js.git",
|
|
10
18
|
"license": "Apache-2.0",
|
|
11
19
|
"files": [
|
|
12
20
|
"dist",
|
|
13
|
-
"src"
|
|
21
|
+
"src",
|
|
22
|
+
"README.md"
|
|
14
23
|
],
|
|
15
24
|
"devDependencies": {
|
|
25
|
+
"@livekit/agents": "^x",
|
|
26
|
+
"@livekit/rtc-node": "^0.12.1",
|
|
16
27
|
"@microsoft/api-extractor": "^7.35.0",
|
|
17
|
-
"@livekit/rtc-node": "^0.11.1",
|
|
18
28
|
"@types/ws": "^8.5.10",
|
|
19
|
-
"
|
|
20
|
-
"
|
|
29
|
+
"tsup": "^8.3.5",
|
|
30
|
+
"typescript": "^5.0.0"
|
|
21
31
|
},
|
|
22
32
|
"dependencies": {
|
|
23
33
|
"openai": "^4.70.2",
|
|
@@ -25,11 +35,11 @@
|
|
|
25
35
|
"ws": "^8.16.0"
|
|
26
36
|
},
|
|
27
37
|
"peerDependencies": {
|
|
28
|
-
"@livekit/rtc-node": "^0.
|
|
29
|
-
"@livekit/agents": "^0.
|
|
38
|
+
"@livekit/rtc-node": "^0.12.1",
|
|
39
|
+
"@livekit/agents": "^0.5.0x"
|
|
30
40
|
},
|
|
31
41
|
"scripts": {
|
|
32
|
-
"build": "tsc
|
|
42
|
+
"build": "tsup --onSuccess \"tsc --declaration --emitDeclarationOnly\"",
|
|
33
43
|
"clean": "rm -rf dist",
|
|
34
44
|
"clean:build": "pnpm clean && pnpm build",
|
|
35
45
|
"lint": "eslint -f unix \"src/**/*.{ts,js}\"",
|
package/src/tts.ts
CHANGED
|
@@ -73,7 +73,8 @@ export class TTS extends tts.TTS {
|
|
|
73
73
|
}
|
|
74
74
|
|
|
75
75
|
export class ChunkedStream extends tts.ChunkedStream {
|
|
76
|
-
|
|
76
|
+
// set Promise<T> to any because OpenAI returns an annoying Response type
|
|
77
|
+
constructor(stream: Promise<any>) {
|
|
77
78
|
super();
|
|
78
79
|
this.#run(stream);
|
|
79
80
|
}
|