npm - @cartesia/cartesia-js - Versions diffs - 1.0.0-alpha.4 → 1.0.1 - Mend

@cartesia/cartesia-js 1.0.0-alpha.4 → 1.0.1

This diff shows the changes between two publicly available versions of the package as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the respective public registry.

Files changed (56)

package/.turbo/turbo-build.log +49 -49
package/CHANGELOG.md +23 -0
package/LICENSE.md +21 -0
package/README.md +102 -21
package/dist/{chunk-VK7LBMVI.js → chunk-2NA5SEML.js} +2 -2
package/dist/{chunk-PQ5EVEEH.js → chunk-5M33ZF3Y.js} +1 -1
package/dist/{chunk-PQ6CIPFW.js → chunk-6YQ6KDIQ.js} +44 -5
package/dist/{chunk-IQAXBRHU.js → chunk-ASZKHN7Q.js} +53 -29
package/dist/{chunk-RO7TY474.js → chunk-BHY7MNGT.js} +11 -6
package/dist/{chunk-WIFMLPT5.js → chunk-GHY2WEOK.js} +13 -0
package/dist/{chunk-SGXUEFII.js → chunk-KUSVZXDT.js} +2 -2
package/dist/{chunk-36JBKJUN.js → chunk-LZO6K34D.js} +20 -7
package/dist/{chunk-3FL2SNIR.js → chunk-NQVZNVOU.js} +1 -1
package/dist/{chunk-ISRU7PLL.js → chunk-OFH3ML4L.js} +3 -3
package/dist/index.cjs +129 -39
package/dist/index.d.cts +4 -4
package/dist/index.d.ts +4 -4
package/dist/index.js +15 -9
package/dist/lib/client.js +2 -2
package/dist/lib/constants.js +1 -1
package/dist/lib/index.cjs +106 -33
package/dist/lib/index.js +8 -8
package/dist/react/index.cjs +231 -92
package/dist/react/index.d.cts +4 -3
package/dist/react/index.d.ts +4 -3
package/dist/react/index.js +117 -64
package/dist/react/utils.js +2 -2
package/dist/tts/index.cjs +106 -33
package/dist/tts/index.js +6 -6
package/dist/tts/player.cjs +23 -5
package/dist/tts/player.d.cts +6 -0
package/dist/tts/player.d.ts +6 -0
package/dist/tts/player.js +4 -3
package/dist/tts/source.cjs +50 -4
package/dist/tts/source.d.cts +16 -6
package/dist/tts/source.d.ts +16 -6
package/dist/tts/source.js +4 -2
package/dist/tts/utils.cjs +18 -6
package/dist/tts/utils.d.cts +7 -5
package/dist/tts/utils.d.ts +7 -5
package/dist/tts/utils.js +3 -2
package/dist/tts/websocket.cjs +106 -33
package/dist/tts/websocket.d.cts +20 -10
package/dist/tts/websocket.d.ts +20 -10
package/dist/tts/websocket.js +5 -5
package/dist/types/index.d.cts +60 -4
package/dist/types/index.d.ts +60 -4
package/dist/voices/index.js +3 -3
package/package.json +1 -1
package/src/index.ts +2 -0
package/src/react/index.ts +117 -62
package/src/tts/player.ts +15 -8
package/src/tts/source.ts +53 -7
package/src/tts/utils.ts +26 -12
package/src/tts/websocket.ts +42 -19
package/src/types/index.ts +81 -3

package/dist/tts/source.cjs CHANGED Viewed

@@ -44,6 +44,10 @@ var __privateSet = (obj, member, value, setter) => {
   setter ? setter.call(obj, value) : member.set(obj, value);
   return value;
 };
+var __privateMethod = (obj, member, method) => {
+  __accessCheck(obj, member, "access private method");
+  return method;
+};
 var __async = (__this, __arguments, generator) => {
   return new Promise((resolve, reject) => {
     var fulfilled = (value) => {
@@ -68,11 +72,18 @@ var __async = (__this, __arguments, generator) => {
 // src/tts/source.ts
 var source_exports = {};
 __export(source_exports, {
+  ENCODING_MAP: () => ENCODING_MAP,
   default: () => Source
 });
 module.exports = __toCommonJS(source_exports);
 var import_emittery = __toESM(require("emittery"), 1);
-var _emitter, _buffer, _readIndex, _writeIndex, _closed, _sampleRate;
+var ENCODING_MAP = {
+  pcm_f32le: { arrayType: Float32Array, bytesPerElement: 4 },
+  pcm_s16le: { arrayType: Int16Array, bytesPerElement: 2 },
+  pcm_alaw: { arrayType: Uint8Array, bytesPerElement: 1 },
+  pcm_mulaw: { arrayType: Uint8Array, bytesPerElement: 1 }
+};
+var _emitter, _buffer, _readIndex, _writeIndex, _closed, _sampleRate, _encoding, _container, _createBuffer, createBuffer_fn;
 var Source = class {
   /**
    * Create a new Source.
@@ -80,23 +91,44 @@ var Source = class {
    * @param options - Options for the Source.
    * @param options.sampleRate - The sample rate of the audio.
    */
-  constructor({ sampleRate }) {
+  constructor({
+    sampleRate,
+    encoding,
+    container
+  }) {
+    /**
+     * Create a new buffer for the source.
+     *
+     * @param size - The size of the buffer to create.
+     * @returns The new buffer as a TypedArray based on the encoding.
+     */
+    __privateAdd(this, _createBuffer);
     __privateAdd(this, _emitter, new import_emittery.default());
     __privateAdd(this, _buffer, void 0);
     __privateAdd(this, _readIndex, 0);
     __privateAdd(this, _writeIndex, 0);
     __privateAdd(this, _closed, false);
     __privateAdd(this, _sampleRate, void 0);
+    __privateAdd(this, _encoding, void 0);
+    __privateAdd(this, _container, void 0);
     this.on = __privateGet(this, _emitter).on.bind(__privateGet(this, _emitter));
     this.once = __privateGet(this, _emitter).once.bind(__privateGet(this, _emitter));
     this.events = __privateGet(this, _emitter).events.bind(__privateGet(this, _emitter));
     this.off = __privateGet(this, _emitter).off.bind(__privateGet(this, _emitter));
     __privateSet(this, _sampleRate, sampleRate);
-    __privateSet(this, _buffer, new Float32Array(1024));
+    __privateSet(this, _encoding, encoding);
+    __privateSet(this, _container, container);
+    __privateSet(this, _buffer, __privateMethod(this, _createBuffer, createBuffer_fn).call(this, 1024));
   }
   get sampleRate() {
     return __privateGet(this, _sampleRate);
   }
+  get encoding() {
+    return __privateGet(this, _encoding);
+  }
+  get container() {
+    return __privateGet(this, _container);
+  }
   /**
    * Append audio to the buffer.
    *
@@ -110,7 +142,7 @@ var Source = class {
         while (newCapacity < requiredCapacity) {
           newCapacity *= 2;
         }
-        const newBuffer = new Float32Array(newCapacity);
+        const newBuffer = __privateMethod(this, _createBuffer, createBuffer_fn).call(this, newCapacity);
         newBuffer.set(__privateGet(this, _buffer));
         __privateSet(this, _buffer, newBuffer);
       }
@@ -158,6 +190,9 @@ var Source = class {
   get readIndex() {
     return __privateGet(this, _readIndex);
   }
+  get writeIndex() {
+    return __privateGet(this, _writeIndex);
+  }
   /**
    * Close the source. This signals that no more audio will be enqueued.
    *
@@ -179,3 +214,14 @@ _readIndex = new WeakMap();
 _writeIndex = new WeakMap();
 _closed = new WeakMap();
 _sampleRate = new WeakMap();
+_encoding = new WeakMap();
+_container = new WeakMap();
+_createBuffer = new WeakSet();
+createBuffer_fn = function(size) {
+  const { arrayType: ArrayType } = ENCODING_MAP[__privateGet(this, _encoding)];
+  return new ArrayType(size);
+};
+// Annotate the CommonJS export names for ESM import in node:
+0 && (module.exports = {
+  ENCODING_MAP
+});

package/dist/tts/source.d.cts CHANGED Viewed

@@ -1,6 +1,11 @@
 import * as emittery from 'emittery';
-import { SourceEventData } from '../types/index.cjs';
+import { Encoding, SourceEventData, TypedArray } from '../types/index.cjs';
+type EncodingInfo = {
+    arrayType: Float32ArrayConstructor | Int16ArrayConstructor | Uint8ArrayConstructor;
+    bytesPerElement: number;
+};
+declare const ENCODING_MAP: Record<Encoding, EncodingInfo>;
 declare class Source {
     #private;
     on: <Name extends keyof SourceEventData | keyof emittery.OmnipresentEventData>(eventName: Name | readonly Name[], listener: (eventData: (SourceEventData & emittery.OmnipresentEventData)[Name]) => void | Promise<void>) => emittery.UnsubscribeFunction;
@@ -13,16 +18,20 @@ declare class Source {
      * @param options - Options for the Source.
      * @param options.sampleRate - The sample rate of the audio.
      */
-    constructor({ sampleRate }: {
+    constructor({ sampleRate, encoding, container, }: {
         sampleRate: number;
+        encoding: string;
+        container: string;
     });
     get sampleRate(): number;
+    get encoding(): Encoding;
+    get container(): string;
     /**
      * Append audio to the buffer.
      *
      * @param src The audio to append.
      */
-    enqueue(src: Float32Array): Promise<void>;
+    enqueue(src: TypedArray): Promise<void>;
     /**
      * Read audio from the buffer.
      *
@@ -30,7 +39,7 @@ declare class Source {
      * @returns The number of samples read. If the source is closed, this will be
      * less than the length of the provided buffer.
      */
-    read(dst: Float32Array): Promise<number>;
+    read(dst: TypedArray): Promise<number>;
     /**
      * Get the number of samples in a given duration.
      *
@@ -38,8 +47,9 @@ declare class Source {
      * @returns The number of samples.
      */
     durationToSampleCount(durationSecs: number): number;
-    get buffer(): Float32Array;
+    get buffer(): TypedArray;
     get readIndex(): number;
+    get writeIndex(): number;
     /**
      * Close the source. This signals that no more audio will be enqueued.
      *
@@ -50,4 +60,4 @@ declare class Source {
     close(): Promise<void>;
 }
-export { Source as default };
+export { ENCODING_MAP, Source as default };

package/dist/tts/source.d.ts CHANGED Viewed

@@ -1,6 +1,11 @@
 import * as emittery from 'emittery';
-import { SourceEventData } from '../types/index.js';
+import { Encoding, SourceEventData, TypedArray } from '../types/index.js';
+type EncodingInfo = {
+    arrayType: Float32ArrayConstructor | Int16ArrayConstructor | Uint8ArrayConstructor;
+    bytesPerElement: number;
+};
+declare const ENCODING_MAP: Record<Encoding, EncodingInfo>;
 declare class Source {
     #private;
     on: <Name extends keyof SourceEventData | keyof emittery.OmnipresentEventData>(eventName: Name | readonly Name[], listener: (eventData: (SourceEventData & emittery.OmnipresentEventData)[Name]) => void | Promise<void>) => emittery.UnsubscribeFunction;
@@ -13,16 +18,20 @@ declare class Source {
      * @param options - Options for the Source.
      * @param options.sampleRate - The sample rate of the audio.
      */
-    constructor({ sampleRate }: {
+    constructor({ sampleRate, encoding, container, }: {
         sampleRate: number;
+        encoding: string;
+        container: string;
     });
     get sampleRate(): number;
+    get encoding(): Encoding;
+    get container(): string;
     /**
      * Append audio to the buffer.
      *
      * @param src The audio to append.
      */
-    enqueue(src: Float32Array): Promise<void>;
+    enqueue(src: TypedArray): Promise<void>;
     /**
      * Read audio from the buffer.
      *
@@ -30,7 +39,7 @@ declare class Source {
      * @returns The number of samples read. If the source is closed, this will be
      * less than the length of the provided buffer.
      */
-    read(dst: Float32Array): Promise<number>;
+    read(dst: TypedArray): Promise<number>;
     /**
      * Get the number of samples in a given duration.
      *
@@ -38,8 +47,9 @@ declare class Source {
      * @returns The number of samples.
      */
     durationToSampleCount(durationSecs: number): number;
-    get buffer(): Float32Array;
+    get buffer(): TypedArray;
     get readIndex(): number;
+    get writeIndex(): number;
     /**
      * Close the source. This signals that no more audio will be enqueued.
      *
@@ -50,4 +60,4 @@ declare class Source {
     close(): Promise<void>;
 }
-export { Source as default };
+export { ENCODING_MAP, Source as default };

package/dist/tts/source.js CHANGED Viewed

@@ -1,7 +1,9 @@
 import {
+  ENCODING_MAP,
   Source
-} from "../chunk-PQ6CIPFW.js";
-import "../chunk-WIFMLPT5.js";
+} from "../chunk-6YQ6KDIQ.js";
+import "../chunk-GHY2WEOK.js";
 export {
+  ENCODING_MAP,
   Source as default
 };

package/dist/tts/utils.cjs CHANGED Viewed

@@ -41,16 +41,28 @@ __export(utils_exports, {
 });
 module.exports = __toCommonJS(utils_exports);
 var import_base64_js = __toESM(require("base64-js"), 1);
-function base64ToArray(b64) {
+// src/tts/source.ts
+var import_emittery = __toESM(require("emittery"), 1);
+var ENCODING_MAP = {
+  pcm_f32le: { arrayType: Float32Array, bytesPerElement: 4 },
+  pcm_s16le: { arrayType: Int16Array, bytesPerElement: 2 },
+  pcm_alaw: { arrayType: Uint8Array, bytesPerElement: 1 },
+  pcm_mulaw: { arrayType: Uint8Array, bytesPerElement: 1 }
+};
+// src/tts/utils.ts
+function base64ToArray(b64, encoding) {
   const byteArrays = filterSentinel(b64).map((b) => import_base64_js.default.toByteArray(b));
+  const { arrayType: ArrayType, bytesPerElement } = ENCODING_MAP[encoding];
   const totalLength = byteArrays.reduce(
-    (acc, arr) => acc + arr.length / Float32Array.BYTES_PER_ELEMENT,
+    (acc, arr) => acc + arr.length / bytesPerElement,
     0
   );
-  const result = new Float32Array(totalLength);
+  const result = new ArrayType(totalLength);
   let offset = 0;
   for (const arr of byteArrays) {
-    const floats = new Float32Array(arr.buffer);
+    const floats = new ArrayType(arr.buffer);
     result.set(floats, offset);
     offset += floats.length;
   }
@@ -81,10 +93,10 @@ function createMessageHandlerForContextId(contextId, handler) {
     let chunk;
     if (message.done) {
       chunk = getSentinel();
-    } else {
+    } else if (message.type === "chunk") {
       chunk = message.data;
     }
-    handler({ chunk, message: event.data });
+    handler({ chunk, message: event.data, data: message });
   };
 }
 function getSentinel() {

package/dist/tts/utils.d.cts CHANGED Viewed

@@ -1,14 +1,15 @@
 import emittery__default from 'emittery';
-import { Chunk, Sentinel, EmitteryCallbacks } from '../types/index.cjs';
+import { Chunk, TypedArray, WebSocketResponse, Sentinel, EmitteryCallbacks } from '../types/index.cjs';
 /**
- * Convert base64-encoded audio buffer(s) to a Float32Array.
+ * Convert base64-encoded audio buffer(s) to a TypedArray.
  *
  * @param b64 The base64-encoded audio buffer, or an array of base64-encoded
  * audio buffers.
- * @returns The audio buffer(s) as a Float32Array.
+ * @param encoding The encoding of the audio buffer(s).
+ * @returns The audio buffer(s) as a TypedArray.
  */
-declare function base64ToArray(b64: Chunk[]): Float32Array;
+declare function base64ToArray(b64: Chunk[], encoding: string): TypedArray;
 /**
  * Schedule an audio buffer to play at a given time in the passed context.
  *
@@ -28,8 +29,9 @@ declare function playAudioBuffer(floats: Float32Array, context: AudioContext, st
  * @returns A message event handler.
  */
 declare function createMessageHandlerForContextId(contextId: string, handler: ({ chunk, message, }: {
-    chunk: Chunk;
+    chunk?: Chunk;
     message: string;
+    data: WebSocketResponse;
 }) => void): (event: MessageEvent) => void;
 /**
  * Get a sentinel value that indicates the end of a stream.

package/dist/tts/utils.d.ts CHANGED Viewed

@@ -1,14 +1,15 @@
 import emittery__default from 'emittery';
-import { Chunk, Sentinel, EmitteryCallbacks } from '../types/index.js';
+import { Chunk, TypedArray, WebSocketResponse, Sentinel, EmitteryCallbacks } from '../types/index.js';
 /**
- * Convert base64-encoded audio buffer(s) to a Float32Array.
+ * Convert base64-encoded audio buffer(s) to a TypedArray.
  *
  * @param b64 The base64-encoded audio buffer, or an array of base64-encoded
  * audio buffers.
- * @returns The audio buffer(s) as a Float32Array.
+ * @param encoding The encoding of the audio buffer(s).
+ * @returns The audio buffer(s) as a TypedArray.
  */
-declare function base64ToArray(b64: Chunk[]): Float32Array;
+declare function base64ToArray(b64: Chunk[], encoding: string): TypedArray;
 /**
  * Schedule an audio buffer to play at a given time in the passed context.
  *
@@ -28,8 +29,9 @@ declare function playAudioBuffer(floats: Float32Array, context: AudioContext, st
  * @returns A message event handler.
  */
 declare function createMessageHandlerForContextId(contextId: string, handler: ({ chunk, message, }: {
-    chunk: Chunk;
+    chunk?: Chunk;
     message: string;
+    data: WebSocketResponse;
 }) => void): (event: MessageEvent) => void;
 /**
  * Get a sentinel value that indicates the end of a stream.

package/dist/tts/utils.js CHANGED Viewed

@@ -7,8 +7,9 @@ import {
   isComplete,
   isSentinel,
   playAudioBuffer
-} from "../chunk-RO7TY474.js";
-import "../chunk-WIFMLPT5.js";
+} from "../chunk-BHY7MNGT.js";
+import "../chunk-6YQ6KDIQ.js";
+import "../chunk-GHY2WEOK.js";
 export {
   base64ToArray,
   createMessageHandlerForContextId,

package/dist/tts/websocket.cjs CHANGED Viewed

@@ -22,6 +22,18 @@ var __spreadValues = (a, b) => {
   return a;
 };
 var __spreadProps = (a, b) => __defProps(a, __getOwnPropDescs(b));
+var __objRest = (source, exclude) => {
+  var target = {};
+  for (var prop in source)
+    if (__hasOwnProp.call(source, prop) && exclude.indexOf(prop) < 0)
+      target[prop] = source[prop];
+  if (source != null && __getOwnPropSymbols)
+    for (var prop of __getOwnPropSymbols(source)) {
+      if (exclude.indexOf(prop) < 0 && __propIsEnum.call(source, prop))
+        target[prop] = source[prop];
+    }
+  return target;
+};
 var __export = (target, all) => {
   for (var name in all)
     __defProp(target, name, { get: all[name], enumerable: true });
@@ -132,7 +144,13 @@ var Client = class {
 // src/tts/source.ts
 var import_emittery = __toESM(require("emittery"), 1);
-var _emitter, _buffer, _readIndex, _writeIndex, _closed, _sampleRate;
+var ENCODING_MAP = {
+  pcm_f32le: { arrayType: Float32Array, bytesPerElement: 4 },
+  pcm_s16le: { arrayType: Int16Array, bytesPerElement: 2 },
+  pcm_alaw: { arrayType: Uint8Array, bytesPerElement: 1 },
+  pcm_mulaw: { arrayType: Uint8Array, bytesPerElement: 1 }
+};
+var _emitter, _buffer, _readIndex, _writeIndex, _closed, _sampleRate, _encoding, _container, _createBuffer, createBuffer_fn;
 var Source = class {
   /**
    * Create a new Source.
@@ -140,23 +158,44 @@ var Source = class {
    * @param options - Options for the Source.
    * @param options.sampleRate - The sample rate of the audio.
    */
-  constructor({ sampleRate }) {
+  constructor({
+    sampleRate,
+    encoding,
+    container
+  }) {
+    /**
+     * Create a new buffer for the source.
+     *
+     * @param size - The size of the buffer to create.
+     * @returns The new buffer as a TypedArray based on the encoding.
+     */
+    __privateAdd(this, _createBuffer);
     __privateAdd(this, _emitter, new import_emittery.default());
     __privateAdd(this, _buffer, void 0);
     __privateAdd(this, _readIndex, 0);
     __privateAdd(this, _writeIndex, 0);
     __privateAdd(this, _closed, false);
     __privateAdd(this, _sampleRate, void 0);
+    __privateAdd(this, _encoding, void 0);
+    __privateAdd(this, _container, void 0);
     this.on = __privateGet(this, _emitter).on.bind(__privateGet(this, _emitter));
     this.once = __privateGet(this, _emitter).once.bind(__privateGet(this, _emitter));
     this.events = __privateGet(this, _emitter).events.bind(__privateGet(this, _emitter));
     this.off = __privateGet(this, _emitter).off.bind(__privateGet(this, _emitter));
     __privateSet(this, _sampleRate, sampleRate);
-    __privateSet(this, _buffer, new Float32Array(1024));
+    __privateSet(this, _encoding, encoding);
+    __privateSet(this, _container, container);
+    __privateSet(this, _buffer, __privateMethod(this, _createBuffer, createBuffer_fn).call(this, 1024));
   }
   get sampleRate() {
     return __privateGet(this, _sampleRate);
   }
+  get encoding() {
+    return __privateGet(this, _encoding);
+  }
+  get container() {
+    return __privateGet(this, _container);
+  }
   /**
    * Append audio to the buffer.
    *
@@ -170,7 +209,7 @@ var Source = class {
         while (newCapacity < requiredCapacity) {
           newCapacity *= 2;
         }
-        const newBuffer = new Float32Array(newCapacity);
+        const newBuffer = __privateMethod(this, _createBuffer, createBuffer_fn).call(this, newCapacity);
         newBuffer.set(__privateGet(this, _buffer));
         __privateSet(this, _buffer, newBuffer);
       }
@@ -218,6 +257,9 @@ var Source = class {
   get readIndex() {
     return __privateGet(this, _readIndex);
   }
+  get writeIndex() {
+    return __privateGet(this, _writeIndex);
+  }
   /**
    * Close the source. This signals that no more audio will be enqueued.
    *
@@ -239,19 +281,27 @@ _readIndex = new WeakMap();
 _writeIndex = new WeakMap();
 _closed = new WeakMap();
 _sampleRate = new WeakMap();
+_encoding = new WeakMap();
+_container = new WeakMap();
+_createBuffer = new WeakSet();
+createBuffer_fn = function(size) {
+  const { arrayType: ArrayType } = ENCODING_MAP[__privateGet(this, _encoding)];
+  return new ArrayType(size);
+};
 // src/tts/utils.ts
 var import_base64_js = __toESM(require("base64-js"), 1);
-function base64ToArray(b64) {
+function base64ToArray(b64, encoding) {
   const byteArrays = filterSentinel(b64).map((b) => import_base64_js.default.toByteArray(b));
+  const { arrayType: ArrayType, bytesPerElement } = ENCODING_MAP[encoding];
   const totalLength = byteArrays.reduce(
-    (acc, arr) => acc + arr.length / Float32Array.BYTES_PER_ELEMENT,
+    (acc, arr) => acc + arr.length / bytesPerElement,
     0
   );
-  const result = new Float32Array(totalLength);
+  const result = new ArrayType(totalLength);
   let offset = 0;
   for (const arr of byteArrays) {
-    const floats = new Float32Array(arr.buffer);
+    const floats = new ArrayType(arr.buffer);
     result.set(floats, offset);
     offset += floats.length;
   }
@@ -269,10 +319,10 @@ function createMessageHandlerForContextId(contextId, handler) {
     let chunk;
     if (message.done) {
       chunk = getSentinel();
-    } else {
+    } else if (message.type === "chunk") {
       chunk = message.data;
     }
-    handler({ chunk, message: event.data });
+    handler({ chunk, message: event.data, data: message });
   };
 }
 function getSentinel() {
@@ -296,14 +346,14 @@ function getEmitteryCallbacks(emitter) {
 }
 // src/tts/websocket.ts
-var _isConnected, _sampleRate2, _generateId, generateId_fn;
+var _isConnected, _sampleRate2, _container2, _encoding2, _generateId, generateId_fn;
 var WebSocket = class extends Client {
   /**
    * Create a new WebSocket client.
    *
    * @param args - Arguments to pass to the Client constructor.
    */
-  constructor({ sampleRate }, ...args) {
+  constructor({ sampleRate, container, encoding }, ...args) {
     super(...args);
     /**
      * Generate a unique ID suitable for a streaming context.
@@ -316,37 +366,47 @@ var WebSocket = class extends Client {
     __privateAdd(this, _generateId);
     __privateAdd(this, _isConnected, false);
     __privateAdd(this, _sampleRate2, void 0);
+    __privateAdd(this, _container2, void 0);
+    __privateAdd(this, _encoding2, void 0);
     __privateSet(this, _sampleRate2, sampleRate);
+    __privateSet(this, _container2, container != null ? container : "raw");
+    __privateSet(this, _encoding2, encoding != null ? encoding : "pcm_f32le");
   }
   /**
-   * Send a message over the WebSocket in order to start a stream.
+   * Send a message over the WebSocket to start a stream.
    *
-   * @param inputs - Stream options.
+   * @param inputs - Stream options. Defined in the StreamRequest type.
    * @param options - Options for the stream.
    * @param options.timeout - The maximum time to wait for a chunk before cancelling the stream.
-   * If `0`, the stream will not time out.
+   *                          If set to `0`, the stream will not time out.
    * @returns A Source object that can be passed to a Player to play the audio.
+   * @returns An Emittery instance that emits messages from the WebSocket.
+   * @returns An abort function that can be called to cancel the stream.
    */
-  send(inputs, { timeout = 0 } = {}) {
-    var _a, _b, _c, _d;
+  send(_a, { timeout = 0 } = {}) {
+    var inputs = __objRest(_a, []);
+    var _a2, _b, _c, _d;
     if (!__privateGet(this, _isConnected)) {
       throw new Error("Not connected to WebSocket. Call .connect() first.");
     }
-    const contextId = __privateMethod(this, _generateId, generateId_fn).call(this);
-    (_a = this.socket) == null ? void 0 : _a.send(
-      JSON.stringify(__spreadProps(__spreadValues({
-        context_id: contextId
-      }, inputs), {
-        output_format: {
-          container: "raw",
-          encoding: "pcm_f32le",
-          sample_rate: __privateGet(this, _sampleRate2)
-        }
-      }))
+    if (!inputs.context_id) {
+      inputs.context_id = __privateMethod(this, _generateId, generateId_fn).call(this);
+    }
+    if (!inputs.output_format) {
+      inputs.output_format = {
+        container: __privateGet(this, _container2),
+        encoding: __privateGet(this, _encoding2),
+        sample_rate: __privateGet(this, _sampleRate2)
+      };
+    }
+    (_a2 = this.socket) == null ? void 0 : _a2.send(
+      JSON.stringify(__spreadValues({}, inputs))
     );
     const emitter = new import_emittery2.default();
     const source = new Source({
-      sampleRate: __privateGet(this, _sampleRate2)
+      sampleRate: __privateGet(this, _sampleRate2),
+      encoding: __privateGet(this, _encoding2),
+      container: __privateGet(this, _container2)
     });
     const streamCompleteController = new AbortController();
     let timeoutId = null;
@@ -354,19 +414,26 @@ var WebSocket = class extends Client {
       timeoutId = setTimeout(streamCompleteController.abort, timeout);
     }
     const handleMessage = createMessageHandlerForContextId(
-      contextId,
-      (_0) => __async(this, [_0], function* ({ chunk, message }) {
+      inputs.context_id,
+      (_0) => __async(this, [_0], function* ({ chunk, message, data }) {
         emitter.emit("message", message);
+        if (data.type === "timestamps") {
+          emitter.emit("timestamps", data.word_timestamps);
+          return;
+        }
         if (isSentinel(chunk)) {
           yield source.close();
           streamCompleteController.abort();
           return;
         }
-        yield source.enqueue(base64ToArray([chunk]));
         if (timeoutId) {
           clearTimeout(timeoutId);
           timeoutId = setTimeout(streamCompleteController.abort, timeout);
         }
+        if (!chunk) {
+          return;
+        }
+        yield source.enqueue(base64ToArray([chunk], __privateGet(this, _encoding2)));
       })
     );
     (_b = this.socket) == null ? void 0 : _b.addEventListener("message", handleMessage, {
@@ -396,7 +463,11 @@ var WebSocket = class extends Client {
         clearTimeout(timeoutId);
       }
     });
-    return __spreadValues({ source }, getEmitteryCallbacks(emitter));
+    return __spreadProps(__spreadValues({
+      source
+    }, getEmitteryCallbacks(emitter)), {
+      stop: streamCompleteController.abort.bind(streamCompleteController)
+    });
   }
   /**
    * Authenticate and connect to a Cartesia streaming WebSocket.
@@ -466,6 +537,8 @@ var WebSocket = class extends Client {
 };
 _isConnected = new WeakMap();
 _sampleRate2 = new WeakMap();
+_container2 = new WeakMap();
+_encoding2 = new WeakMap();
 _generateId = new WeakSet();
 generateId_fn = function() {
   return (0, import_human_id.humanId)({