npm - @cartesia/cartesia-js - Versions diffs - 0.0.4-alpha.0 → 1.0.0-alpha.1 - Mend

@cartesia/cartesia-js 0.0.4-alpha.0 → 1.0.0-alpha.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

package/.turbo/turbo-build.log +64 -46
package/CHANGELOG.md +6 -0
package/README.md +123 -16
package/dist/{chunk-XPIMIAAE.js → chunk-3FL2SNIR.js} +1 -1
package/dist/chunk-3GBZUGUD.js +17 -0
package/dist/chunk-4RMSIQLG.js +25 -0
package/dist/chunk-BCQ63627.js +32 -0
package/dist/chunk-JOHSCOLW.js +106 -0
package/dist/chunk-LYPTISWL.js +75 -0
package/dist/chunk-NDNN326Q.js +207 -0
package/dist/chunk-WBK6LLXX.js +58 -0
package/dist/chunk-WE63M7PJ.js +119 -0
package/dist/{chunk-R4P7LWVZ.js → chunk-WIFMLPT5.js} +31 -6
package/dist/chunk-X7SJMF2R.js +22 -0
package/dist/index.cjs +391 -158
package/dist/index.d.cts +7 -3
package/dist/index.d.ts +7 -3
package/dist/index.js +13 -6
package/dist/lib/client.cjs +46 -0
package/dist/lib/client.d.cts +2 -0
package/dist/lib/client.d.ts +2 -0
package/dist/lib/client.js +3 -3
package/dist/lib/constants.cjs +11 -7
package/dist/lib/constants.d.cts +2 -3
package/dist/lib/constants.d.ts +2 -3
package/dist/lib/constants.js +4 -6
package/dist/lib/index.cjs +276 -163
package/dist/lib/index.d.cts +6 -2
package/dist/lib/index.d.ts +6 -2
package/dist/lib/index.js +9 -6
package/dist/react/index.cjs +524 -275
package/dist/react/index.d.cts +20 -14
package/dist/react/index.d.ts +20 -14
package/dist/react/index.js +142 -98
package/dist/react/utils.js +2 -2
package/dist/tts/index.cjs +470 -0
package/dist/tts/index.d.cts +17 -0
package/dist/tts/index.d.ts +17 -0
package/dist/tts/index.js +12 -0
package/dist/tts/player.cjs +198 -0
package/dist/tts/player.d.cts +43 -0
package/dist/tts/player.d.ts +43 -0
package/dist/tts/player.js +8 -0
package/dist/tts/source.cjs +167 -0
package/dist/tts/source.d.cts +53 -0
package/dist/tts/source.d.ts +53 -0
package/dist/tts/source.js +7 -0
package/dist/{audio → tts}/utils.cjs +12 -53
package/dist/tts/utils.d.cts +67 -0
package/dist/tts/utils.d.ts +67 -0
package/dist/{audio → tts}/utils.js +2 -7
package/dist/{audio/index.cjs → tts/websocket.cjs} +213 -164
package/dist/tts/websocket.d.cts +53 -0
package/dist/tts/websocket.d.ts +53 -0
package/dist/tts/websocket.js +11 -0
package/dist/types/index.d.cts +50 -1
package/dist/types/index.d.ts +50 -1
package/dist/voices/index.cjs +155 -0
package/dist/voices/index.d.cts +12 -0
package/dist/voices/index.d.ts +12 -0
package/dist/voices/index.js +9 -0
package/package.json +2 -1
package/src/index.ts +1 -0
package/src/lib/client.ts +14 -1
package/src/lib/constants.ts +13 -3
package/src/lib/index.ts +6 -3
package/src/react/index.ts +157 -103
package/src/tts/index.ts +17 -0
package/src/tts/player.ts +109 -0
package/src/tts/source.ts +98 -0
package/src/{audio → tts}/utils.ts +19 -97
package/src/tts/websocket.ts +210 -0
package/src/types/index.ts +63 -0
package/src/voices/index.ts +47 -0
package/dist/audio/index.d.cts +0 -5
package/dist/audio/index.d.ts +0 -5
package/dist/audio/index.js +0 -10
package/dist/audio/utils.d.cts +0 -5
package/dist/audio/utils.d.ts +0 -5
package/dist/chunk-4MHF74A7.js +0 -272
package/dist/chunk-5TSWLYOW.js +0 -113
package/dist/chunk-MJIFZWHS.js +0 -18
package/dist/chunk-OVI3W3GG.js +0 -12
package/dist/chunk-S6A27RQL.js +0 -18
package/dist/index-C2_3XFxn.d.cts +0 -163
package/dist/index-DgwnZezj.d.ts +0 -163
package/src/audio/index.ts +0 -297

package/dist/index.cjs CHANGED Viewed

@@ -1,15 +1,14 @@
 "use strict";
 var __create = Object.create;
 var __defProp = Object.defineProperty;
+var __defProps = Object.defineProperties;
 var __getOwnPropDesc = Object.getOwnPropertyDescriptor;
+var __getOwnPropDescs = Object.getOwnPropertyDescriptors;
 var __getOwnPropNames = Object.getOwnPropertyNames;
 var __getOwnPropSymbols = Object.getOwnPropertySymbols;
 var __getProtoOf = Object.getPrototypeOf;
 var __hasOwnProp = Object.prototype.hasOwnProperty;
 var __propIsEnum = Object.prototype.propertyIsEnumerable;
-var __knownSymbol = (name, symbol) => {
-  return (symbol = Symbol[name]) ? symbol : Symbol.for("Symbol." + name);
-};
 var __defNormalProp = (obj, key, value) => key in obj ? __defProp(obj, key, { enumerable: true, configurable: true, writable: true, value }) : obj[key] = value;
 var __spreadValues = (a, b) => {
   for (var prop in b || (b = {}))
@@ -22,6 +21,7 @@ var __spreadValues = (a, b) => {
     }
   return a;
 };
+var __spreadProps = (a, b) => __defProps(a, __getOwnPropDescs(b));
 var __export = (target, all) => {
   for (var name in all)
     __defProp(target, name, { get: all[name], enumerable: true });
@@ -43,6 +43,28 @@ var __toESM = (mod, isNodeMode, target) => (target = mod != null ? __create(__ge
   mod
 ));
 var __toCommonJS = (mod) => __copyProps(__defProp({}, "__esModule", { value: true }), mod);
+var __accessCheck = (obj, member, msg) => {
+  if (!member.has(obj))
+    throw TypeError("Cannot " + msg);
+};
+var __privateGet = (obj, member, getter) => {
+  __accessCheck(obj, member, "read from private field");
+  return getter ? getter.call(obj) : member.get(obj);
+};
+var __privateAdd = (obj, member, value) => {
+  if (member.has(obj))
+    throw TypeError("Cannot add the same private member more than once");
+  member instanceof WeakSet ? member.add(obj) : member.set(obj, value);
+};
+var __privateSet = (obj, member, value, setter) => {
+  __accessCheck(obj, member, "write to private field");
+  setter ? setter.call(obj, value) : member.set(obj, value);
+  return value;
+};
+var __privateMethod = (obj, member, method) => {
+  __accessCheck(obj, member, "access private method");
+  return method;
+};
 var __async = (__this, __arguments, generator) => {
   return new Promise((resolve, reject) => {
     var fulfilled = (value) => {
@@ -63,26 +85,30 @@ var __async = (__this, __arguments, generator) => {
     step((generator = generator.apply(__this, __arguments)).next());
   });
 };
-var __forAwait = (obj, it, method) => (it = obj[__knownSymbol("asyncIterator")]) ? it.call(obj) : (obj = obj[__knownSymbol("iterator")](), it = {}, method = (key, fn) => (fn = obj[key]) && (it[key] = (arg) => new Promise((yes, no, done) => (arg = fn.call(obj, arg), done = arg.done, Promise.resolve(arg.value).then((value) => yes({ value, done }), no)))), method("next"), method("return"), it);
 // src/index.ts
 var src_exports = {};
 __export(src_exports, {
   Cartesia: () => Cartesia,
+  WebPlayer: () => Player,
   default: () => Cartesia
 });
 module.exports = __toCommonJS(src_exports);
-// src/audio/index.ts
-var import_emittery = __toESM(require("emittery"), 1);
-var import_human_id = require("human-id");
-var import_partysocket = require("partysocket");
+// src/lib/client.ts
+var import_cross_fetch = __toESM(require("cross-fetch"), 1);
 // src/lib/constants.ts
 var BASE_URL = "https://api.cartesia.ai/v0";
-var SAMPLE_RATE = 44100;
-var constructWebsocketUrl = (baseUrl) => {
-  return new URL(`${baseUrl.replace(/^http/, "ws")}/audio/websocket`);
+var constructApiUrl = (baseUrl, path, protocol) => {
+  const normalizedPath = path.startsWith("/") ? path : `/${path}`;
+  if (!protocol) {
+    return new URL(`${baseUrl}${normalizedPath}`);
+  }
+  if (!["http", "ws"].includes(protocol)) {
+    throw new Error(`Invalid protocol: ${protocol}`);
+  }
+  return new URL(`${baseUrl.replace(/^http/, protocol)}${normalizedPath}`);
 };
 // src/lib/client.ts
@@ -94,14 +120,119 @@ var Client = class {
     this.apiKey = options.apiKey || process.env.CARTESIA_API_KEY;
     this.baseUrl = options.baseUrl || BASE_URL;
   }
+  fetch(path, options = {}) {
+    const url = constructApiUrl(this.baseUrl, path);
+    return (0, import_cross_fetch.default)(url.toString(), __spreadProps(__spreadValues({}, options), {
+      headers: __spreadValues({
+        "X-API-KEY": this.apiKey
+      }, options.headers)
+    }));
+  }
 };
-// src/audio/utils.ts
+// src/tts/websocket.ts
+var import_emittery2 = __toESM(require("emittery"), 1);
+var import_human_id = require("human-id");
+var import_partysocket = require("partysocket");
+// src/tts/source.ts
+var import_emittery = __toESM(require("emittery"), 1);
+var _emitter, _buffer, _readIndex, _closed, _sampleRate;
+var Source = class {
+  /**
+   * Create a new Source.
+   *
+   * @param options - Options for the Source.
+   * @param options.sampleRate - The sample rate of the audio.
+   */
+  constructor({ sampleRate }) {
+    __privateAdd(this, _emitter, new import_emittery.default());
+    __privateAdd(this, _buffer, new Float32Array());
+    __privateAdd(this, _readIndex, 0);
+    __privateAdd(this, _closed, false);
+    __privateAdd(this, _sampleRate, void 0);
+    this.on = __privateGet(this, _emitter).on.bind(__privateGet(this, _emitter));
+    this.once = __privateGet(this, _emitter).once.bind(__privateGet(this, _emitter));
+    this.events = __privateGet(this, _emitter).events.bind(__privateGet(this, _emitter));
+    this.off = __privateGet(this, _emitter).off.bind(__privateGet(this, _emitter));
+    __privateSet(this, _sampleRate, sampleRate);
+  }
+  get sampleRate() {
+    return __privateGet(this, _sampleRate);
+  }
+  /**
+   * Append audio to the buffer.
+   *
+   * @param src The audio to append.
+   */
+  enqueue(src) {
+    return __async(this, null, function* () {
+      __privateSet(this, _buffer, new Float32Array([...__privateGet(this, _buffer), ...src]));
+      yield __privateGet(this, _emitter).emit("enqueue");
+    });
+  }
+  /**
+   * Read audio from the buffer.
+   *
+   * @param dst The buffer to read the audio into.
+   * @returns The number of samples read. If the source is closed, this will be
+   * less than the length of the provided buffer.
+   */
+  read(dst) {
+    return __async(this, null, function* () {
+      const targetReadIndex = __privateGet(this, _readIndex) + dst.length;
+      while (!__privateGet(this, _closed) && targetReadIndex > __privateGet(this, _buffer).length) {
+        yield __privateGet(this, _emitter).emit("wait");
+        yield Promise.race([
+          __privateGet(this, _emitter).once("enqueue"),
+          __privateGet(this, _emitter).once("close")
+        ]);
+        yield __privateGet(this, _emitter).emit("read");
+      }
+      const read = Math.min(dst.length, __privateGet(this, _buffer).length - __privateGet(this, _readIndex));
+      dst.set(__privateGet(this, _buffer).slice(__privateGet(this, _readIndex), __privateGet(this, _readIndex) + read));
+      __privateSet(this, _readIndex, __privateGet(this, _readIndex) + read);
+      return read;
+    });
+  }
+  /**
+   * Get the number of samples in a given duration.
+   *
+   * @param durationSecs The duration in seconds.
+   * @returns The number of samples.
+   */
+  durationToSampleCount(durationSecs) {
+    return Math.trunc(durationSecs * __privateGet(this, _sampleRate));
+  }
+  get buffer() {
+    return __privateGet(this, _buffer);
+  }
+  get readIndex() {
+    return __privateGet(this, _readIndex);
+  }
+  /**
+   * Close the source. This signals that no more audio will be enqueued.
+   *
+   * This will emit a "close" event.
+   *
+   * @returns A promise that resolves when the source is closed.
+   */
+  close() {
+    return __async(this, null, function* () {
+      __privateSet(this, _closed, true);
+      yield __privateGet(this, _emitter).emit("close");
+      __privateGet(this, _emitter).clearListeners();
+    });
+  }
+};
+_emitter = new WeakMap();
+_buffer = new WeakMap();
+_readIndex = new WeakMap();
+_closed = new WeakMap();
+_sampleRate = new WeakMap();
+// src/tts/utils.ts
 var import_base64_js = __toESM(require("base64-js"), 1);
-function getBufferDuration(b64) {
-  const floats = base64ToArray(b64);
-  return floats.length / SAMPLE_RATE;
-}
 function base64ToArray(b64) {
   return filterSentinel(b64).reduce((acc, b) => {
     const floats = new Float32Array(import_base64_js.default.toByteArray(b).buffer);
@@ -111,20 +242,24 @@ function base64ToArray(b64) {
     return newAcc;
   }, new Float32Array(0));
 }
-function playAudioBuffer(b64, context, maybeStartAt = null, onEnded = null) {
-  const startAt = maybeStartAt != null ? maybeStartAt : context.currentTime;
-  const floats = base64ToArray(b64);
+function playAudioBuffer(floats, context, startAt, sampleRate) {
   const source = context.createBufferSource();
-  const buffer = context.createBuffer(1, floats.length, SAMPLE_RATE);
+  const buffer = context.createBuffer(1, floats.length, sampleRate);
   buffer.getChannelData(0).set(floats);
   source.buffer = buffer;
   source.connect(context.destination);
   source.start(startAt);
-  source.onended = onEnded;
-  return buffer.duration;
+  return new Promise((resolve) => {
+    source.onended = () => {
+      resolve();
+    };
+  });
 }
 function createMessageHandlerForContextId(contextId, handler) {
   return (event) => {
+    if (typeof event.data !== "string") {
+      return;
+    }
     const message = JSON.parse(event.data);
     if (message.context_id !== contextId) {
       return;
@@ -135,7 +270,7 @@ function createMessageHandlerForContextId(contextId, handler) {
     } else {
       chunk = message.data;
     }
-    handler({ chunk, message });
+    handler({ chunk, message: event.data });
   };
 }
 function getSentinel() {
@@ -149,9 +284,6 @@ function filterSentinel(collection) {
     (x) => !isSentinel(x)
   );
 }
-function isComplete(chunks) {
-  return isSentinel(chunks[chunks.length - 1]);
-}
 function getEmitteryCallbacks(emitter) {
   return {
     on: emitter.on.bind(emitter),
@@ -161,58 +293,75 @@ function getEmitteryCallbacks(emitter) {
   };
 }
-// src/audio/index.ts
-var audio_default = class extends Client {
-  constructor() {
-    super(...arguments);
-    this.isConnected = false;
+// src/tts/websocket.ts
+var _isConnected, _sampleRate2, _generateId, generateId_fn;
+var WebSocket = class extends Client {
+  /**
+   * Create a new WebSocket client.
+   *
+   * @param args - Arguments to pass to the Client constructor.
+   */
+  constructor({ sampleRate }, ...args) {
+    super(...args);
+    /**
+     * Generate a unique ID suitable for a streaming context.
+     *
+     * Not suitable for security purposes or as a primary key, since
+     * it lacks the amount of entropy required for those use cases.
+     *
+     * @returns A unique ID.
+     */
+    __privateAdd(this, _generateId);
+    __privateAdd(this, _isConnected, false);
+    __privateAdd(this, _sampleRate2, void 0);
+    __privateSet(this, _sampleRate2, sampleRate);
   }
   /**
-   * Stream audio from a model.
+   * Send a message over the WebSocket in order to start a stream.
    *
-   * @param inputs - Stream options. Includes a `model` key and some `parameters`, which
-   * are model-specific and can be found in the model's documentation.
+   * @param inputs - Stream options.
    * @param options - Options for the stream.
    * @param options.timeout - The maximum time to wait for a chunk before cancelling the stream.
    * If `0`, the stream will not time out.
-   * @returns An object with a method `play` of type `(bufferDuration: number) => Promise<void>`
-   * that plays the audio as it arrives, with `bufferDuration` seconds of audio buffered before
-   * starting playback.
+   * @returns A Source object that can be passed to a Player to play the audio.
    */
-  stream(inputs, { timeout = 0 } = {}) {
+  send(inputs, { timeout = 0 } = {}) {
     var _a, _b, _c, _d;
-    if (!this.isConnected) {
+    if (!__privateGet(this, _isConnected)) {
       throw new Error("Not connected to WebSocket. Call .connect() first.");
     }
-    const contextId = this.generateId();
+    const contextId = __privateMethod(this, _generateId, generateId_fn).call(this);
     (_a = this.socket) == null ? void 0 : _a.send(
-      JSON.stringify({
-        data: inputs,
+      JSON.stringify(__spreadProps(__spreadValues({
         context_id: contextId
-      })
+      }, inputs), {
+        output_format: {
+          container: "raw",
+          encoding: "pcm_f32le",
+          sample_rate: __privateGet(this, _sampleRate2)
+        }
+      }))
     );
+    const emitter = new import_emittery2.default();
+    const source = new Source({
+      sampleRate: __privateGet(this, _sampleRate2)
+    });
     const streamCompleteController = new AbortController();
     let timeoutId = null;
     if (timeout > 0) {
       timeoutId = setTimeout(streamCompleteController.abort, timeout);
     }
-    const chunks = [];
-    const emitter = new import_emittery.default();
     const handleMessage = createMessageHandlerForContextId(
       contextId,
       (_0) => __async(this, [_0], function* ({ chunk, message }) {
-        chunks.push(chunk);
-        yield emitter.emit("chunk", {
-          chunk,
-          chunks
-        });
-        yield emitter.emit("message", message);
+        emitter.emit("message", message);
         if (isSentinel(chunk)) {
-          yield emitter.emit("streamed", {
-            chunks
-          });
+          yield source.close();
           streamCompleteController.abort();
-        } else if (timeoutId) {
+          return;
+        }
+        yield source.enqueue(base64ToArray([chunk]));
+        if (timeoutId) {
           clearTimeout(timeoutId);
           timeoutId = setTimeout(streamCompleteController.abort, timeout);
         }
@@ -240,107 +389,12 @@ var audio_default = class extends Client {
       }
     );
     streamCompleteController.signal.addEventListener("abort", () => {
+      source.close();
       if (timeoutId) {
         clearTimeout(timeoutId);
       }
-      emitter.clearListeners();
-    });
-    const play = (_0) => __async(this, [_0], function* ({ bufferDuration }) {
-      const context = new AudioContext({
-        sampleRate: SAMPLE_RATE
-      });
-      let startNextPlaybackAt = 0;
-      const playLatestChunk = (chunk) => {
-        if (isSentinel(chunk)) {
-          return true;
-        }
-        startNextPlaybackAt = playAudioBuffer([chunk], context, startNextPlaybackAt) + Math.max(context.currentTime, startNextPlaybackAt);
-        return false;
-      };
-      const playChunks = (chunks2) => {
-        startNextPlaybackAt += playAudioBuffer(
-          chunks2,
-          context,
-          startNextPlaybackAt
-        );
-        if (isComplete(chunks2)) {
-          return;
-        }
-      };
-      const tryStart = (chunks2) => __async(this, null, function* () {
-        startNextPlaybackAt = context.currentTime;
-        if (isComplete(chunks2) || streamCompleteController.signal.aborted) {
-          emitter.emit("buffered");
-          playChunks(chunks2);
-          return true;
-        }
-        if (getBufferDuration(chunks2) > bufferDuration) {
-          emitter.emit("buffered");
-          playChunks(chunks2);
-          try {
-            for (var iter2 = __forAwait(emitter.events("chunk")), more2, temp2, error2; more2 = !(temp2 = yield iter2.next()).done; more2 = false) {
-              const { chunk } = temp2.value;
-              if (playLatestChunk(chunk)) {
-                break;
-              }
-            }
-          } catch (temp2) {
-            error2 = [temp2];
-          } finally {
-            try {
-              more2 && (temp2 = iter2.return) && (yield temp2.call(iter2));
-            } finally {
-              if (error2)
-                throw error2[0];
-            }
-          }
-          return true;
-        }
-        emitter.emit("buffering");
-        return false;
-      });
-      if (!(yield tryStart(chunks))) {
-        try {
-          for (var iter = __forAwait(emitter.events("chunk")), more, temp, error; more = !(temp = yield iter.next()).done; more = false) {
-            const { chunks: chunks2 } = temp.value;
-            if (yield tryStart(chunks2)) {
-              const playbackEndsIn = Math.max(0, startNextPlaybackAt - context.currentTime) * 1e3;
-              emitter.emit("scheduled", { playbackEndsIn });
-              break;
-            }
-          }
-        } catch (temp) {
-          error = [temp];
-        } finally {
-          try {
-            more && (temp = iter.return) && (yield temp.call(iter));
-          } finally {
-            if (error)
-              throw error[0];
-          }
-        }
-      } else {
-        const playbackEndsIn = Math.max(0, startNextPlaybackAt - context.currentTime) * 1e3;
-        emitter.emit("scheduled", { playbackEndsIn });
-      }
-    });
-    return __spreadValues({
-      play
-    }, getEmitteryCallbacks(emitter));
-  }
-  /**
-   * Generate a unique ID suitable for a streaming context.
-   *
-   * Not suitable for security purposes or as a primary key, since
-   * it lacks the amount of entropy required for those use cases.
-   *
-   * @returns A unique ID.
-   */
-  generateId() {
-    return (0, import_human_id.humanId)({
-      separator: "-",
-      capitalize: false
     });
+    return __spreadValues({ source }, getEmitteryCallbacks(emitter));
   }
   /**
    * Authenticate and connect to a Cartesia streaming WebSocket.
@@ -349,16 +403,16 @@ var audio_default = class extends Client {
    * @throws {Error} If the WebSocket fails to connect.
    */
   connect() {
-    const url = constructWebsocketUrl(this.baseUrl);
+    const url = constructApiUrl(this.baseUrl, "/tts/websocket", "ws");
     url.searchParams.set("api_key", this.apiKey);
-    const emitter = new import_emittery.default();
+    const emitter = new import_emittery2.default();
     this.socket = new import_partysocket.WebSocket(url.toString());
     this.socket.onopen = () => {
-      this.isConnected = true;
+      __privateSet(this, _isConnected, true);
       emitter.emit("open");
     };
     this.socket.onclose = () => {
-      this.isConnected = false;
+      __privateSet(this, _isConnected, false);
       emitter.emit("close");
     };
     return new Promise(
@@ -405,15 +459,194 @@ var audio_default = class extends Client {
     (_a = this.socket) == null ? void 0 : _a.close();
   }
 };
+_isConnected = new WeakMap();
+_sampleRate2 = new WeakMap();
+_generateId = new WeakSet();
+generateId_fn = function() {
+  return (0, import_human_id.humanId)({
+    separator: "-",
+    capitalize: false
+  });
+};
+// src/tts/index.ts
+var TTS = class extends Client {
+  /**
+   * Get a WebSocket client for streaming audio from the TTS API.
+   *
+   * @returns {WebSocket} A Cartesia WebSocket client.
+   */
+  websocket(options) {
+    return new WebSocket(options, {
+      apiKey: this.apiKey,
+      baseUrl: this.baseUrl
+    });
+  }
+};
+// src/voices/index.ts
+var Voices = class extends Client {
+  list() {
+    return __async(this, null, function* () {
+      const response = yield this.fetch("/voices");
+      return response.json();
+    });
+  }
+  get(voiceId) {
+    return __async(this, null, function* () {
+      const response = yield this.fetch(`/voices/${voiceId}`);
+      return response.json();
+    });
+  }
+  create(voice) {
+    return __async(this, null, function* () {
+      const response = yield this.fetch("/voices", {
+        method: "POST",
+        body: JSON.stringify(voice)
+      });
+      return response.json();
+    });
+  }
+  clone(options) {
+    return __async(this, null, function* () {
+      if (options.mode === "url") {
+        const response = yield this.fetch(
+          `/voices/clone/url?link=${options.link}`,
+          {
+            method: "POST"
+          }
+        );
+        return response.json();
+      }
+      if (options.mode === "clip") {
+        const formData = new FormData();
+        formData.append("clip", options.clip);
+        const response = yield this.fetch("/voices/clone/clip", {
+          method: "POST",
+          body: formData
+        });
+        return response.json();
+      }
+      throw new Error("Invalid mode for clone()");
+    });
+  }
+};
 // src/lib/index.ts
 var Cartesia = class extends Client {
   constructor(options = {}) {
     super(options);
-    this.audio = new audio_default(options);
+    this.tts = new TTS(options);
+    this.voices = new Voices(options);
   }
 };
+// src/tts/player.ts
+var import_emittery3 = __toESM(require("emittery"), 1);
+var _context, _startNextPlaybackAt, _bufferDuration, _emitter2, _playBuffer, playBuffer_fn;
+var Player = class {
+  /**
+   * Create a new Player.
+   *
+   * @param options - Options for the Player.
+   * @param options.bufferDuration - The duration of the audio buffer to play.
+   */
+  constructor({ bufferDuration }) {
+    __privateAdd(this, _playBuffer);
+    __privateAdd(this, _context, null);
+    __privateAdd(this, _startNextPlaybackAt, 0);
+    __privateAdd(this, _bufferDuration, void 0);
+    __privateAdd(this, _emitter2, new import_emittery3.default());
+    __privateSet(this, _bufferDuration, bufferDuration);
+  }
+  /**
+   * Play audio from a source.
+   *
+   * @param source The source to play audio from.
+   * @returns A promise that resolves when the audio has finished playing.
+   */
+  play(source) {
+    return __async(this, null, function* () {
+      __privateSet(this, _startNextPlaybackAt, 0);
+      __privateSet(this, _context, new AudioContext({ sampleRate: source.sampleRate }));
+      const buffer = new Float32Array(
+        source.durationToSampleCount(__privateGet(this, _bufferDuration))
+      );
+      const plays = [];
+      while (true) {
+        const read = yield source.read(buffer);
+        const playableAudio = buffer.slice(0, read);
+        plays.push(__privateMethod(this, _playBuffer, playBuffer_fn).call(this, playableAudio, source.sampleRate));
+        if (read < buffer.length) {
+          yield __privateGet(this, _emitter2).emit("finish");
+          break;
+        }
+      }
+      yield Promise.all(plays);
+    });
+  }
+  /**
+   * Pause the audio.
+   *
+   * @returns A promise that resolves when the audio has been paused.
+   */
+  pause() {
+    return __async(this, null, function* () {
+      if (!__privateGet(this, _context)) {
+        throw new Error("AudioContext not initialized.");
+      }
+      yield __privateGet(this, _context).suspend();
+    });
+  }
+  /**
+   * Resume the audio.
+   *
+   * @returns A promise that resolves when the audio has been resumed.
+   */
+  resume() {
+    return __async(this, null, function* () {
+      if (!__privateGet(this, _context)) {
+        throw new Error("AudioContext not initialized.");
+      }
+      yield __privateGet(this, _context).resume();
+    });
+  }
+  /**
+   * Toggle the audio.
+   *
+   * @returns A promise that resolves when the audio has been toggled.
+   */
+  toggle() {
+    return __async(this, null, function* () {
+      if (!__privateGet(this, _context)) {
+        throw new Error("AudioContext not initialized.");
+      }
+      if (__privateGet(this, _context).state === "running") {
+        yield this.pause();
+      } else {
+        yield this.resume();
+      }
+    });
+  }
+};
+_context = new WeakMap();
+_startNextPlaybackAt = new WeakMap();
+_bufferDuration = new WeakMap();
+_emitter2 = new WeakMap();
+_playBuffer = new WeakSet();
+playBuffer_fn = function(buf, sampleRate) {
+  return __async(this, null, function* () {
+    if (!__privateGet(this, _context)) {
+      throw new Error("AudioContext not initialized.");
+    }
+    const startAt = __privateGet(this, _startNextPlaybackAt);
+    const duration = buf.length / sampleRate;
+    __privateSet(this, _startNextPlaybackAt, duration + Math.max(__privateGet(this, _context).currentTime, __privateGet(this, _startNextPlaybackAt)));
+    yield playAudioBuffer(buf, __privateGet(this, _context), startAt, sampleRate);
+  });
+};
 // Annotate the CommonJS export names for ESM import in node:
 0 && (module.exports = {
-  Cartesia
+  Cartesia,
+  WebPlayer
 });