npm - kugelaudio - Versions diffs - 0.1.1 → 0.1.2 - Mend

kugelaudio 0.1.1 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

package/README.md CHANGED Viewed

@@ -31,7 +31,7 @@ const client = new KugelAudio({ apiKey: 'your_api_key' });
 // Generate speech
 const audio = await client.tts.generate({
   text: 'Hello, world!',
-  model: 'kugel-one-turbo',
+  model: 'kugel-1-turbo',
 });
 // Create a playable blob (browser)
@@ -86,8 +86,8 @@ const client = new KugelAudio({
 | Model ID | Name | Parameters | Description |
 |----------|------|------------|-------------|
-| `kugel-one-turbo` | Kugel One Turbo | 1.5B | Fast, low-latency model for real-time applications |
-| `kugel-one` | Kugel One | 7B | Premium quality model for pre-recorded content |
+| `kugel-1-turbo` | Kugel 1 Turbo | 1.5B | Fast, low-latency model for real-time applications |
+| `kugel-1` | Kugel 1 | 7B | Premium quality model for pre-recorded content |
 ### List Available Models
@@ -144,7 +144,7 @@ Generate complete audio and receive it all at once:
 ```typescript
 const audio = await client.tts.generate({
   text: 'Hello, this is a test of the KugelAudio text-to-speech system.',
-  model: 'kugel-one-turbo',  // 'kugel-one-turbo' (fast) or 'kugel-one' (quality)
+  model: 'kugel-1-turbo',  // 'kugel-1-turbo' (fast) or 'kugel-1' (quality)
   voiceId: 123,              // Optional: specific voice ID
   cfgScale: 2.0,             // Guidance scale (1.0-5.0)
   maxNewTokens: 2048,        // Maximum tokens to generate
@@ -169,7 +169,7 @@ import { createWavBlob } from 'kugelaudio';
 const audio = await client.tts.generate({
   text: 'Hello, world!',
-  model: 'kugel-one-turbo',
+  model: 'kugel-1-turbo',
 });
 // Create WAV blob for playback
@@ -198,7 +198,7 @@ Receive audio chunks as they are generated for lower latency:
 await client.tts.stream(
   {
     text: 'Hello, this is streaming audio.',
-    model: 'kugel-one-turbo',
+    model: 'kugel-1-turbo',
   },
   {
     onOpen: () => {
@@ -300,7 +300,7 @@ interface KugelAudioOptions {
 ```typescript
 interface GenerateOptions {
   text: string;            // Required: Text to synthesize
-  model?: string;          // Default: 'kugel-one-turbo'
+  model?: string;          // Default: 'kugel-1-turbo'
   voiceId?: number;        // Optional: Voice ID
   cfgScale?: number;       // Default: 2.0
   maxNewTokens?: number;   // Default: 2048
@@ -364,7 +364,7 @@ interface StreamCallbacks {
 ```typescript
 interface Model {
-  id: string;             // 'kugel-one-turbo' or 'kugel-one'
+  id: string;             // 'kugel-1-turbo' or 'kugel-1'
   name: string;           // Human-readable name
   description: string;    // Model description
   parameters: string;     // Parameter count ('1.5B', '7B')
@@ -467,7 +467,7 @@ async function main() {
   await client.tts.stream(
     {
       text: 'Welcome to KugelAudio. This is an example of high-quality text-to-speech synthesis.',
-      model: 'kugel-one-turbo',
+      model: 'kugel-1-turbo',
     },
     {
       onChunk: (chunk) => {

package/dist/index.d.mts CHANGED Viewed

@@ -47,7 +47,7 @@ interface Voice {
 interface GenerateOptions {
     /** Text to synthesize */
     text: string;
-    /** Model to use (default: 'kugel-one-turbo') */
+    /** Model to use: 'kugel-1-turbo' (1.5B, fast) or 'kugel-1' (7B, premium). Default: 'kugel-1-turbo' */
     model?: string;
     /** Voice ID to use */
     voiceId?: number;
@@ -200,16 +200,46 @@ declare class VoicesResource {
  */
 declare class TTSResource {
     private client;
+    private wsConnection;
+    private wsUrl;
+    private pendingRequests;
+    private requestCounter;
     constructor(client: KugelAudio);
     /**
      * Generate audio from text with streaming via WebSocket.
      * Returns complete audio after all chunks are received.
      */
     generate(options: GenerateOptions): Promise<AudioResponse>;
+    /**
+     * Get or create a WebSocket connection for connection pooling.
+     * This avoids the ~220ms connect overhead on each request.
+     */
+    private getConnection;
+    /**
+     * Setup message handler for pooled connection.
+     */
+    private setupMessageHandler;
     /**
      * Stream audio from text via WebSocket.
+     * Uses connection pooling for faster TTFA (~180ms vs ~400ms).
+     *
+     * @param options - Generation options
+     * @param callbacks - Stream callbacks
+     * @param reuseConnection - If true (default), reuse WebSocket connection
+     */
+    stream(options: GenerateOptions, callbacks: StreamCallbacks, reuseConnection?: boolean): Promise<void>;
+    /**
+     * Stream with connection pooling (fast path).
+     */
+    private streamWithPooling;
+    /**
+     * Stream without connection pooling (original behavior).
      */
-    stream(options: GenerateOptions, callbacks: StreamCallbacks): Promise<void>;
+    private streamWithoutPooling;
+    /**
+     * Close the pooled WebSocket connection.
+     */
+    close(): void;
     private parseError;
 }
 /**
@@ -225,10 +255,16 @@ declare class TTSResource {
  * // List voices
  * const voices = await client.voices.list();
  *
- * // Generate audio
+ * // Generate audio with fast model (1.5B params)
+ * const audio = await client.tts.generate({
+ *   text: 'Hello, world!',
+ *   model: 'kugel-1-turbo',
+ * });
+ *
+ * // Generate audio with premium model (7B params)
  * const audio = await client.tts.generate({
  *   text: 'Hello, world!',
- *   model: 'kugel-one-turbo',
+ *   model: 'kugel-1',
  * });
  * ```
  */
@@ -248,6 +284,11 @@ declare class KugelAudio {
     get apiKey(): string;
     /** Get TTS URL */
     get ttsUrl(): string;
+    /**
+     * Close the client and release resources.
+     * This closes any pooled WebSocket connections.
+     */
+    close(): void;
     /**
      * Make an HTTP request to the API.
      * @internal

package/dist/index.d.ts CHANGED Viewed

@@ -47,7 +47,7 @@ interface Voice {
 interface GenerateOptions {
     /** Text to synthesize */
     text: string;
-    /** Model to use (default: 'kugel-one-turbo') */
+    /** Model to use: 'kugel-1-turbo' (1.5B, fast) or 'kugel-1' (7B, premium). Default: 'kugel-1-turbo' */
     model?: string;
     /** Voice ID to use */
     voiceId?: number;
@@ -200,16 +200,46 @@ declare class VoicesResource {
  */
 declare class TTSResource {
     private client;
+    private wsConnection;
+    private wsUrl;
+    private pendingRequests;
+    private requestCounter;
     constructor(client: KugelAudio);
     /**
      * Generate audio from text with streaming via WebSocket.
      * Returns complete audio after all chunks are received.
      */
     generate(options: GenerateOptions): Promise<AudioResponse>;
+    /**
+     * Get or create a WebSocket connection for connection pooling.
+     * This avoids the ~220ms connect overhead on each request.
+     */
+    private getConnection;
+    /**
+     * Setup message handler for pooled connection.
+     */
+    private setupMessageHandler;
     /**
      * Stream audio from text via WebSocket.
+     * Uses connection pooling for faster TTFA (~180ms vs ~400ms).
+     *
+     * @param options - Generation options
+     * @param callbacks - Stream callbacks
+     * @param reuseConnection - If true (default), reuse WebSocket connection
+     */
+    stream(options: GenerateOptions, callbacks: StreamCallbacks, reuseConnection?: boolean): Promise<void>;
+    /**
+     * Stream with connection pooling (fast path).
+     */
+    private streamWithPooling;
+    /**
+     * Stream without connection pooling (original behavior).
      */
-    stream(options: GenerateOptions, callbacks: StreamCallbacks): Promise<void>;
+    private streamWithoutPooling;
+    /**
+     * Close the pooled WebSocket connection.
+     */
+    close(): void;
     private parseError;
 }
 /**
@@ -225,10 +255,16 @@ declare class TTSResource {
  * // List voices
  * const voices = await client.voices.list();
  *
- * // Generate audio
+ * // Generate audio with fast model (1.5B params)
+ * const audio = await client.tts.generate({
+ *   text: 'Hello, world!',
+ *   model: 'kugel-1-turbo',
+ * });
+ *
+ * // Generate audio with premium model (7B params)
  * const audio = await client.tts.generate({
  *   text: 'Hello, world!',
- *   model: 'kugel-one-turbo',
+ *   model: 'kugel-1',
  * });
  * ```
  */
@@ -248,6 +284,11 @@ declare class KugelAudio {
     get apiKey(): string;
     /** Get TTS URL */
     get ttsUrl(): string;
+    /**
+     * Close the client and release resources.
+     * This closes any pooled WebSocket connections.
+     */
+    close(): void;
     /**
      * Make an HTTP request to the API.
      * @internal

package/dist/index.js CHANGED Viewed

@@ -212,6 +212,10 @@ var VoicesResource = class {
 var TTSResource = class {
   constructor(client) {
     this.client = client;
+    this.wsConnection = null;
+    this.wsUrl = null;
+    this.pendingRequests = /* @__PURE__ */ new Map();
+    this.requestCounter = 0;
   }
   /**
    * Generate audio from text with streaming via WebSocket.
@@ -244,10 +248,142 @@ var TTSResource = class {
       rtf: finalStats ? finalStats.rtf : 0
     };
   }
+  /**
+   * Get or create a WebSocket connection for connection pooling.
+   * This avoids the ~220ms connect overhead on each request.
+   */
+  async getConnection() {
+    const wsUrl = this.client.ttsUrl.replace("https://", "wss://").replace("http://", "ws://");
+    const url = `${wsUrl}/ws/tts?api_key=${this.client.apiKey}`;
+    if (this.wsConnection && this.wsUrl === url && this.wsConnection.readyState === WebSocket.OPEN) {
+      return this.wsConnection;
+    }
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+      }
+      this.wsConnection = null;
+    }
+    return new Promise((resolve, reject) => {
+      const ws = new WebSocket(url);
+      ws.onopen = () => {
+        this.wsConnection = ws;
+        this.wsUrl = url;
+        this.setupMessageHandler(ws);
+        resolve(ws);
+      };
+      ws.onerror = () => {
+        reject(new KugelAudioError("WebSocket connection error"));
+      };
+    });
+  }
+  /**
+   * Setup message handler for pooled connection.
+   */
+  setupMessageHandler(ws) {
+    ws.onmessage = (event) => {
+      try {
+        const data = JSON.parse(event.data);
+        const [requestId, pending] = [...this.pendingRequests.entries()][0] || [];
+        if (!pending) return;
+        if (data.error) {
+          const error = this.parseError(data.error);
+          pending.callbacks.onError?.(error);
+          this.pendingRequests.delete(requestId);
+          pending.reject(error);
+          return;
+        }
+        if (data.final) {
+          const stats = {
+            final: true,
+            chunks: data.chunks,
+            totalSamples: data.total_samples,
+            durationMs: data.dur_ms,
+            generationMs: data.gen_ms,
+            ttfaMs: data.ttfa_ms,
+            rtf: data.rtf,
+            error: data.error
+          };
+          pending.callbacks.onFinal?.(stats);
+          this.pendingRequests.delete(requestId);
+          pending.resolve();
+          return;
+        }
+        if (data.audio) {
+          const chunk = {
+            audio: data.audio,
+            encoding: data.enc || "pcm_s16le",
+            index: data.idx,
+            sampleRate: data.sr,
+            samples: data.samples
+          };
+          pending.callbacks.onChunk?.(chunk);
+        }
+      } catch (e) {
+        console.error("Failed to parse WebSocket message:", e);
+      }
+    };
+    ws.onclose = (event) => {
+      this.wsConnection = null;
+      this.wsUrl = null;
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onClose?.();
+        if (event.code === 4001) {
+          pending.reject(new AuthenticationError("Authentication failed"));
+        } else if (event.code === 4003) {
+          pending.reject(new InsufficientCreditsError("Insufficient credits"));
+        }
+        this.pendingRequests.delete(id);
+      }
+    };
+    ws.onerror = () => {
+      const error = new KugelAudioError("WebSocket connection error");
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onError?.(error);
+        pending.reject(error);
+        this.pendingRequests.delete(id);
+      }
+    };
+  }
   /**
    * Stream audio from text via WebSocket.
+   * Uses connection pooling for faster TTFA (~180ms vs ~400ms).
+   *
+   * @param options - Generation options
+   * @param callbacks - Stream callbacks
+   * @param reuseConnection - If true (default), reuse WebSocket connection
+   */
+  stream(options, callbacks, reuseConnection = true) {
+    if (reuseConnection) {
+      return this.streamWithPooling(options, callbacks);
+    }
+    return this.streamWithoutPooling(options, callbacks);
+  }
+  /**
+   * Stream with connection pooling (fast path).
+   */
+  async streamWithPooling(options, callbacks) {
+    const ws = await this.getConnection();
+    const requestId = ++this.requestCounter;
+    return new Promise((resolve, reject) => {
+      this.pendingRequests.set(requestId, { callbacks, resolve, reject });
+      callbacks.onOpen?.();
+      ws.send(JSON.stringify({
+        text: options.text,
+        model: options.model || "kugel-1-turbo",
+        voice_id: options.voiceId,
+        cfg_scale: options.cfgScale ?? 2,
+        max_new_tokens: options.maxNewTokens ?? 2048,
+        sample_rate: options.sampleRate ?? 24e3,
+        speaker_prefix: options.speakerPrefix ?? true
+      }));
+    });
+  }
+  /**
+   * Stream without connection pooling (original behavior).
    */
-  stream(options, callbacks) {
+  streamWithoutPooling(options, callbacks) {
     return new Promise((resolve, reject) => {
       const wsUrl = this.client.ttsUrl.replace("https://", "wss://").replace("http://", "ws://");
       const url = `${wsUrl}/ws/tts?api_key=${this.client.apiKey}`;
@@ -256,7 +392,7 @@ var TTSResource = class {
         callbacks.onOpen?.();
         ws.send(JSON.stringify({
           text: options.text,
-          model: options.model || "kugel-one-turbo",
+          model: options.model || "kugel-1-turbo",
           voice_id: options.voiceId,
           cfg_scale: options.cfgScale ?? 2,
           max_new_tokens: options.maxNewTokens ?? 2048,
@@ -319,6 +455,19 @@ var TTSResource = class {
       };
     });
   }
+  /**
+   * Close the pooled WebSocket connection.
+   */
+  close() {
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+      }
+      this.wsConnection = null;
+      this.wsUrl = null;
+    }
+  }
   parseError(message) {
     const lower = message.toLowerCase();
     if (lower.includes("auth") || lower.includes("unauthorized")) {
@@ -351,6 +500,13 @@ var KugelAudio = class {
   get ttsUrl() {
     return this._ttsUrl;
   }
+  /**
+   * Close the client and release resources.
+   * This closes any pooled WebSocket connections.
+   */
+  close() {
+    this.tts.close();
+  }
   /**
    * Make an HTTP request to the API.
    * @internal

package/dist/index.mjs CHANGED Viewed

@@ -176,6 +176,10 @@ var VoicesResource = class {
 var TTSResource = class {
   constructor(client) {
     this.client = client;
+    this.wsConnection = null;
+    this.wsUrl = null;
+    this.pendingRequests = /* @__PURE__ */ new Map();
+    this.requestCounter = 0;
   }
   /**
    * Generate audio from text with streaming via WebSocket.
@@ -208,10 +212,142 @@ var TTSResource = class {
       rtf: finalStats ? finalStats.rtf : 0
     };
   }
+  /**
+   * Get or create a WebSocket connection for connection pooling.
+   * This avoids the ~220ms connect overhead on each request.
+   */
+  async getConnection() {
+    const wsUrl = this.client.ttsUrl.replace("https://", "wss://").replace("http://", "ws://");
+    const url = `${wsUrl}/ws/tts?api_key=${this.client.apiKey}`;
+    if (this.wsConnection && this.wsUrl === url && this.wsConnection.readyState === WebSocket.OPEN) {
+      return this.wsConnection;
+    }
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+      }
+      this.wsConnection = null;
+    }
+    return new Promise((resolve, reject) => {
+      const ws = new WebSocket(url);
+      ws.onopen = () => {
+        this.wsConnection = ws;
+        this.wsUrl = url;
+        this.setupMessageHandler(ws);
+        resolve(ws);
+      };
+      ws.onerror = () => {
+        reject(new KugelAudioError("WebSocket connection error"));
+      };
+    });
+  }
+  /**
+   * Setup message handler for pooled connection.
+   */
+  setupMessageHandler(ws) {
+    ws.onmessage = (event) => {
+      try {
+        const data = JSON.parse(event.data);
+        const [requestId, pending] = [...this.pendingRequests.entries()][0] || [];
+        if (!pending) return;
+        if (data.error) {
+          const error = this.parseError(data.error);
+          pending.callbacks.onError?.(error);
+          this.pendingRequests.delete(requestId);
+          pending.reject(error);
+          return;
+        }
+        if (data.final) {
+          const stats = {
+            final: true,
+            chunks: data.chunks,
+            totalSamples: data.total_samples,
+            durationMs: data.dur_ms,
+            generationMs: data.gen_ms,
+            ttfaMs: data.ttfa_ms,
+            rtf: data.rtf,
+            error: data.error
+          };
+          pending.callbacks.onFinal?.(stats);
+          this.pendingRequests.delete(requestId);
+          pending.resolve();
+          return;
+        }
+        if (data.audio) {
+          const chunk = {
+            audio: data.audio,
+            encoding: data.enc || "pcm_s16le",
+            index: data.idx,
+            sampleRate: data.sr,
+            samples: data.samples
+          };
+          pending.callbacks.onChunk?.(chunk);
+        }
+      } catch (e) {
+        console.error("Failed to parse WebSocket message:", e);
+      }
+    };
+    ws.onclose = (event) => {
+      this.wsConnection = null;
+      this.wsUrl = null;
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onClose?.();
+        if (event.code === 4001) {
+          pending.reject(new AuthenticationError("Authentication failed"));
+        } else if (event.code === 4003) {
+          pending.reject(new InsufficientCreditsError("Insufficient credits"));
+        }
+        this.pendingRequests.delete(id);
+      }
+    };
+    ws.onerror = () => {
+      const error = new KugelAudioError("WebSocket connection error");
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onError?.(error);
+        pending.reject(error);
+        this.pendingRequests.delete(id);
+      }
+    };
+  }
   /**
    * Stream audio from text via WebSocket.
+   * Uses connection pooling for faster TTFA (~180ms vs ~400ms).
+   *
+   * @param options - Generation options
+   * @param callbacks - Stream callbacks
+   * @param reuseConnection - If true (default), reuse WebSocket connection
+   */
+  stream(options, callbacks, reuseConnection = true) {
+    if (reuseConnection) {
+      return this.streamWithPooling(options, callbacks);
+    }
+    return this.streamWithoutPooling(options, callbacks);
+  }
+  /**
+   * Stream with connection pooling (fast path).
+   */
+  async streamWithPooling(options, callbacks) {
+    const ws = await this.getConnection();
+    const requestId = ++this.requestCounter;
+    return new Promise((resolve, reject) => {
+      this.pendingRequests.set(requestId, { callbacks, resolve, reject });
+      callbacks.onOpen?.();
+      ws.send(JSON.stringify({
+        text: options.text,
+        model: options.model || "kugel-1-turbo",
+        voice_id: options.voiceId,
+        cfg_scale: options.cfgScale ?? 2,
+        max_new_tokens: options.maxNewTokens ?? 2048,
+        sample_rate: options.sampleRate ?? 24e3,
+        speaker_prefix: options.speakerPrefix ?? true
+      }));
+    });
+  }
+  /**
+   * Stream without connection pooling (original behavior).
    */
-  stream(options, callbacks) {
+  streamWithoutPooling(options, callbacks) {
     return new Promise((resolve, reject) => {
       const wsUrl = this.client.ttsUrl.replace("https://", "wss://").replace("http://", "ws://");
       const url = `${wsUrl}/ws/tts?api_key=${this.client.apiKey}`;
@@ -220,7 +356,7 @@ var TTSResource = class {
         callbacks.onOpen?.();
         ws.send(JSON.stringify({
           text: options.text,
-          model: options.model || "kugel-one-turbo",
+          model: options.model || "kugel-1-turbo",
           voice_id: options.voiceId,
           cfg_scale: options.cfgScale ?? 2,
           max_new_tokens: options.maxNewTokens ?? 2048,
@@ -283,6 +419,19 @@ var TTSResource = class {
       };
     });
   }
+  /**
+   * Close the pooled WebSocket connection.
+   */
+  close() {
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+      }
+      this.wsConnection = null;
+      this.wsUrl = null;
+    }
+  }
   parseError(message) {
     const lower = message.toLowerCase();
     if (lower.includes("auth") || lower.includes("unauthorized")) {
@@ -315,6 +464,13 @@ var KugelAudio = class {
   get ttsUrl() {
     return this._ttsUrl;
   }
+  /**
+   * Close the client and release resources.
+   * This closes any pooled WebSocket connections.
+   */
+  close() {
+    this.tts.close();
+  }
   /**
    * Make an HTTP request to the API.
    * @internal

package/package.json CHANGED Viewed

@@ -1,15 +1,15 @@
 {
   "name": "kugelaudio",
-  "version": "0.1.1",
+  "version": "0.1.2",
   "description": "Official JavaScript/TypeScript SDK for KugelAudio TTS API",
   "main": "dist/index.js",
   "module": "dist/index.mjs",
   "types": "dist/index.d.ts",
   "exports": {
     ".": {
+      "types": "./dist/index.d.ts",
       "import": "./dist/index.mjs",
-      "require": "./dist/index.js",
-      "types": "./dist/index.d.ts"
+      "require": "./dist/index.js"
     }
   },
   "files": [

package/src/client.ts CHANGED Viewed

@@ -111,6 +111,15 @@ class VoicesResource {
  * TTS resource for text-to-speech generation.
  */
 class TTSResource {
+  private wsConnection: WebSocket | null = null;
+  private wsUrl: string | null = null;
+  private pendingRequests: Map<number, {
+    callbacks: StreamCallbacks;
+    resolve: () => void;
+    reject: (error: Error) => void;
+  }> = new Map();
+  private requestCounter = 0;
   constructor(private client: KugelAudio) {}
   /**
@@ -149,10 +158,185 @@ class TTSResource {
     };
   }
+  /**
+   * Get or create a WebSocket connection for connection pooling.
+   * This avoids the ~220ms connect overhead on each request.
+   */
+  private async getConnection(): Promise<WebSocket> {
+    const wsUrl = this.client.ttsUrl
+      .replace('https://', 'wss://')
+      .replace('http://', 'ws://');
+    const url = `${wsUrl}/ws/tts?api_key=${this.client.apiKey}`;
+    // Return existing connection if valid
+    if (
+      this.wsConnection &&
+      this.wsUrl === url &&
+      this.wsConnection.readyState === WebSocket.OPEN
+    ) {
+      return this.wsConnection;
+    }
+    // Close old connection if URL changed
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+        // Ignore close errors
+      }
+      this.wsConnection = null;
+    }
+    // Create new connection
+    return new Promise((resolve, reject) => {
+      const ws = new WebSocket(url);
+      ws.onopen = () => {
+        this.wsConnection = ws;
+        this.wsUrl = url;
+        this.setupMessageHandler(ws);
+        resolve(ws);
+      };
+      ws.onerror = () => {
+        reject(new KugelAudioError('WebSocket connection error'));
+      };
+    });
+  }
+  /**
+   * Setup message handler for pooled connection.
+   */
+  private setupMessageHandler(ws: WebSocket): void {
+    ws.onmessage = (event) => {
+      try {
+        const data = JSON.parse(event.data);
+        // Get the current pending request (we process one at a time)
+        const [requestId, pending] = [...this.pendingRequests.entries()][0] || [];
+        if (!pending) return;
+        if (data.error) {
+          const error = this.parseError(data.error);
+          pending.callbacks.onError?.(error);
+          this.pendingRequests.delete(requestId);
+          pending.reject(error);
+          return;
+        }
+        if (data.final) {
+          const stats: GenerationStats = {
+            final: true,
+            chunks: data.chunks,
+            totalSamples: data.total_samples,
+            durationMs: data.dur_ms,
+            generationMs: data.gen_ms,
+            ttfaMs: data.ttfa_ms,
+            rtf: data.rtf,
+            error: data.error,
+          };
+          pending.callbacks.onFinal?.(stats);
+          this.pendingRequests.delete(requestId);
+          pending.resolve();
+          return;
+        }
+        if (data.audio) {
+          const chunk: AudioChunk = {
+            audio: data.audio,
+            encoding: data.enc || 'pcm_s16le',
+            index: data.idx,
+            sampleRate: data.sr,
+            samples: data.samples,
+          };
+          pending.callbacks.onChunk?.(chunk);
+        }
+      } catch (e) {
+        console.error('Failed to parse WebSocket message:', e);
+      }
+    };
+    ws.onclose = (event) => {
+      // Clear connection pool
+      this.wsConnection = null;
+      this.wsUrl = null;
+      // Reject all pending requests
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onClose?.();
+        if (event.code === 4001) {
+          pending.reject(new AuthenticationError('Authentication failed'));
+        } else if (event.code === 4003) {
+          pending.reject(new InsufficientCreditsError('Insufficient credits'));
+        }
+        this.pendingRequests.delete(id);
+      }
+    };
+    ws.onerror = () => {
+      // Reject all pending requests
+      const error = new KugelAudioError('WebSocket connection error');
+      for (const [id, pending] of this.pendingRequests) {
+        pending.callbacks.onError?.(error);
+        pending.reject(error);
+        this.pendingRequests.delete(id);
+      }
+    };
+  }
   /**
    * Stream audio from text via WebSocket.
+   * Uses connection pooling for faster TTFA (~180ms vs ~400ms).
+   *
+   * @param options - Generation options
+   * @param callbacks - Stream callbacks
+   * @param reuseConnection - If true (default), reuse WebSocket connection
    */
-  stream(options: GenerateOptions, callbacks: StreamCallbacks): Promise<void> {
+  stream(
+    options: GenerateOptions,
+    callbacks: StreamCallbacks,
+    reuseConnection = true
+  ): Promise<void> {
+    if (reuseConnection) {
+      return this.streamWithPooling(options, callbacks);
+    }
+    return this.streamWithoutPooling(options, callbacks);
+  }
+  /**
+   * Stream with connection pooling (fast path).
+   */
+  private async streamWithPooling(
+    options: GenerateOptions,
+    callbacks: StreamCallbacks
+  ): Promise<void> {
+    const ws = await this.getConnection();
+    const requestId = ++this.requestCounter;
+    return new Promise((resolve, reject) => {
+      this.pendingRequests.set(requestId, { callbacks, resolve, reject });
+      callbacks.onOpen?.();
+      ws.send(JSON.stringify({
+        text: options.text,
+        model: options.model || 'kugel-1-turbo',
+        voice_id: options.voiceId,
+        cfg_scale: options.cfgScale ?? 2.0,
+        max_new_tokens: options.maxNewTokens ?? 2048,
+        sample_rate: options.sampleRate ?? 24000,
+        speaker_prefix: options.speakerPrefix ?? true,
+      }));
+    });
+  }
+  /**
+   * Stream without connection pooling (original behavior).
+   */
+  private streamWithoutPooling(
+    options: GenerateOptions,
+    callbacks: StreamCallbacks
+  ): Promise<void> {
     return new Promise((resolve, reject) => {
       const wsUrl = this.client.ttsUrl
         .replace('https://', 'wss://')
@@ -166,7 +350,7 @@ class TTSResource {
         // Send TTS request
         ws.send(JSON.stringify({
           text: options.text,
-          model: options.model || 'kugel-one-turbo',
+          model: options.model || 'kugel-1-turbo',
           voice_id: options.voiceId,
           cfg_scale: options.cfgScale ?? 2.0,
           max_new_tokens: options.maxNewTokens ?? 2048,
@@ -236,6 +420,21 @@ class TTSResource {
     });
   }
+  /**
+   * Close the pooled WebSocket connection.
+   */
+  close(): void {
+    if (this.wsConnection) {
+      try {
+        this.wsConnection.close();
+      } catch {
+        // Ignore close errors
+      }
+      this.wsConnection = null;
+      this.wsUrl = null;
+    }
+  }
   private parseError(message: string): Error {
     const lower = message.toLowerCase();
     if (lower.includes('auth') || lower.includes('unauthorized')) {
@@ -261,10 +460,16 @@ class TTSResource {
  * // List voices
  * const voices = await client.voices.list();
  *
- * // Generate audio
+ * // Generate audio with fast model (1.5B params)
  * const audio = await client.tts.generate({
  *   text: 'Hello, world!',
- *   model: 'kugel-one-turbo',
+ *   model: 'kugel-1-turbo',
+ * });
+ *
+ * // Generate audio with premium model (7B params)
+ * const audio = await client.tts.generate({
+ *   text: 'Hello, world!',
+ *   model: 'kugel-1',
  * });
  * ```
  */
@@ -307,6 +512,14 @@ export class KugelAudio {
     return this._ttsUrl;
   }
+  /**
+   * Close the client and release resources.
+   * This closes any pooled WebSocket connections.
+   */
+  close(): void {
+    this.tts.close();
+  }
   /**
    * Make an HTTP request to the API.
    * @internal

package/src/index.ts CHANGED Viewed

@@ -18,13 +18,13 @@
  * // Generate audio (non-streaming)
  * const audio = await client.tts.generate({
  *   text: 'Hello, world!',
- *   model: 'kugel-one-turbo',
+ *   model: 'kugel-1-turbo',
  *   voiceId: 123,
  * });
  *
  * // Generate audio (streaming)
  * await client.tts.stream(
- *   { text: 'Hello, world!', model: 'kugel-one-turbo' },
+ *   { text: 'Hello, world!', model: 'kugel-1-turbo' },
  *   {
  *     onChunk: (chunk) => {
  *       // Process audio chunk

package/src/types.ts CHANGED Viewed

@@ -53,7 +53,7 @@ export interface Voice {
 export interface GenerateOptions {
   /** Text to synthesize */
   text: string;
-  /** Model to use (default: 'kugel-one-turbo') */
+  /** Model to use: 'kugel-1-turbo' (1.5B, fast) or 'kugel-1' (7B, premium). Default: 'kugel-1-turbo' */
   model?: string;
   /** Voice ID to use */
   voiceId?: number;