@mastra/voice-deepgram 0.1.0-alpha.2

@@ -0,0 +1,18 @@
+
+ > @mastra/voice-deepgram@0.1.0-alpha.2 build /home/runner/work/mastra/mastra/voice/deepgram
+ > tsup src/index.ts --format esm --experimental-dts --clean --treeshake
+
+ CLI Building entry: src/index.ts
+ CLI Using tsconfig: tsconfig.json
+ CLI tsup v8.3.6
+ TSC Build start
+ TSC ⚡️ Build success in 6794ms
+ DTS Build start
+ CLI Target: es2022
+ Analysis will use the bundled TypeScript version 5.7.3
+ Writing package typings: /home/runner/work/mastra/mastra/voice/deepgram/dist/_tsup-dts-rollup.d.ts
+ DTS ⚡️ Build success in 4973ms
+ CLI Cleaning output folder
+ ESM Build start
+ ESM dist/index.js 4.50 KB
+ ESM ⚡️ Build success in 262ms
package/CHANGELOG.md ADDED
@@ -0,0 +1,22 @@
+ # Changelog
+
+ ## 0.1.0-alpha.2
+
+ ### Patch Changes
+
+ - abe4600: deprecate @mastra/speech-deepgram for @mastra/voice-deepgram
+ - Updated dependencies [7fceae1]
+ - Updated dependencies [f626fbb]
+   - @mastra/core@0.4.2-alpha.0
+
+ ## 0.1.0 (2024-XX-XX)
+
+ This package replaces the deprecated @mastra/speech-deepgram package. All functionality has been migrated to this new package with a more consistent naming scheme.
+
+ ### Changes from @mastra/speech-deepgram
+
+ - Package renamed from @mastra/speech-deepgram to @mastra/voice-deepgram
+ - All functionality remains the same
+ - Import paths should be updated from '@mastra/speech-deepgram' to '@mastra/voice-deepgram'
+
+ For a complete history of changes prior to the rename, please see the changelog of the original package.
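For consumers following the rename, the migration is a one-line import change; a minimal sketch (the export name is assumed to carry over unchanged, since the notes above state functionality is identical):

```typescript
// Before (deprecated package; export name assumed identical per the notes above):
// import { DeepgramVoice } from '@mastra/speech-deepgram';

// After (this package):
import { DeepgramVoice } from '@mastra/voice-deepgram';

// Assumes DEEPGRAM_API_KEY is set in the environment.
const voice = new DeepgramVoice();
```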
package/LICENSE ADDED
@@ -0,0 +1,44 @@
+ Elastic License 2.0 (ELv2)
+
+ **Acceptance**
+ By using the software, you agree to all of the terms and conditions below.
+
+ **Copyright License**
+ The licensor grants you a non-exclusive, royalty-free, worldwide, non-sublicensable, non-transferable license to use, copy, distribute, make available, and prepare derivative works of the software, in each case subject to the limitations and conditions below.
+
+ **Limitations**
+ You may not provide the software to third parties as a hosted or managed service, where the service provides users with access to any substantial set of the features or functionality of the software.
+
+ You may not move, change, disable, or circumvent the license key functionality in the software, and you may not remove or obscure any functionality in the software that is protected by the license key.
+
+ You may not alter, remove, or obscure any licensing, copyright, or other notices of the licensor in the software. Any use of the licensor’s trademarks is subject to applicable law.
+
+ **Patents**
+ The licensor grants you a license, under any patent claims the licensor can license, or becomes able to license, to make, have made, use, sell, offer for sale, import and have imported the software, in each case subject to the limitations and conditions in this license. This license does not cover any patent claims that you cause to be infringed by modifications or additions to the software. If you or your company make any written claim that the software infringes or contributes to infringement of any patent, your patent license for the software granted under these terms ends immediately. If your company makes such a claim, your patent license ends immediately for work on behalf of your company.
+
+ **Notices**
+ You must ensure that anyone who gets a copy of any part of the software from you also gets a copy of these terms.
+
+ If you modify the software, you must include in any modified copies of the software prominent notices stating that you have modified the software.
+
+ **No Other Rights**
+ These terms do not imply any licenses other than those expressly granted in these terms.
+
+ **Termination**
+ If you use the software in violation of these terms, such use is not licensed, and your licenses will automatically terminate. If the licensor provides you with a notice of your violation, and you cease all violation of this license no later than 30 days after you receive that notice, your licenses will be reinstated retroactively. However, if you violate these terms after such reinstatement, any additional violation of these terms will cause your licenses to terminate automatically and permanently.
+
+ **No Liability**
+ As far as the law allows, the software comes as is, without any warranty or condition, and the licensor will not be liable to you for any damages arising out of these terms or the use or nature of the software, under any kind of legal claim.
+
+ **Definitions**
+ The _licensor_ is the entity offering these terms, and the _software_ is the software the licensor makes available under these terms, including any portion of it.
+
+ _you_ refers to the individual or entity agreeing to these terms.
+
+ _your company_ is any legal entity, sole proprietorship, or other kind of organization that you work for, plus all organizations that have control over, are under the control of, or are under common control with that organization. _control_ means ownership of substantially all the assets of an entity, or the power to direct its management and policies by vote, contract, or otherwise. Control can be direct or indirect.
+
+ _your licenses_ are all the licenses granted to you for the software under these terms.
+
+ _use_ means anything you do with the software requiring one of your licenses.
+
+ _trademark_ means trademarks, service marks, and similar rights.
package/README.md ADDED
@@ -0,0 +1,71 @@
+ # @mastra/voice-deepgram
+
+ Deepgram voice integration for Mastra, providing both Text-to-Speech (TTS) and Speech-to-Text (STT) capabilities using Deepgram's AI models.
+
+ ## Installation
+
+ ```bash
+ npm install @mastra/voice-deepgram
+ ```
+
+ ## Configuration
+
+ The module requires a Deepgram API key, which can be provided through the DEEPGRAM_API_KEY environment variable or directly in the configuration:
+
+ ```bash
+ DEEPGRAM_API_KEY=your_api_key
+ ```
+
+ ## Usage
+
+ ```typescript
+ import { DeepgramVoice } from '@mastra/voice-deepgram';
+
+ // Create voice with both speech and listening capabilities
+ const voice = new DeepgramVoice({
+   speechModel: {
+     name: 'aura', // TTS model family; joined with the speaker id to form e.g. aura-asteria-en
+     apiKey: 'your-api-key', // Optional, can use DEEPGRAM_API_KEY env var
+   },
+   listeningModel: {
+     name: 'nova', // Optional, specify a listening model
+     apiKey: 'your-api-key', // Optional, can use DEEPGRAM_API_KEY env var
+   },
+   speaker: 'athena-en', // Optional, specify a speaker voice (defaults to asteria-en)
+ });
+
+ // List available voices
+ const voices = await voice.getSpeakers();
+
+ // Generate speech
+ const audioStream = await voice.speak('Hello from Mastra!', {
+   speaker: 'athena-en', // Optional: override the default speaker
+   // Any additional options are passed through to Deepgram's speak request
+ });
+
+ // Convert speech to text
+ const text = await voice.listen(audioStream);
+ ```
+
+ ## Features
+
+ - High-quality Text-to-Speech synthesis
+ - Accurate Speech-to-Text transcription
+
+ ## Voice Options
+
+ Deepgram provides several AI voices with different characteristics:
+
+ - aura-asteria-en (Female, American)
+ - aura-athena-en (Female, American)
+ - aura-zeus-en (Male, American)
+ - aura-hera-en (Female, American)
+ - aura-orion-en (Male, American)
+
+ Note that the `speaker` option takes the voice id without the model prefix (e.g. `asteria-en`, not `aura-asteria-en`); the package joins it with the speech model name internally.
+
+ View the complete list in the `voices.ts` file or [Deepgram's documentation](https://developers.deepgram.com/docs/tts-models).
+
+ ### New Features
+
+ - **Speaker Selection**: You can now specify a speaker voice when initializing the `DeepgramVoice` class, allowing for more personalized speech generation.
+
+ - **Updated `speak` Method**: The `speak` method now accepts an optional `speaker` parameter in its options, letting you choose the voice for speech synthesis dynamically.
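Since `speak()` resolves to a Node readable stream, a common next step is persisting the audio. A minimal sketch using only Node's standard `fs` and `stream/promises` modules (the filename and default-constructor usage are illustrative, and DEEPGRAM_API_KEY is assumed to be set):

```typescript
import { createWriteStream } from 'fs';
import { pipeline } from 'stream/promises';
import { DeepgramVoice } from '@mastra/voice-deepgram';

const voice = new DeepgramVoice(); // reads DEEPGRAM_API_KEY from the environment

// speak() resolves to a NodeJS.ReadableStream of encoded audio.
const audio = await voice.speak('Saving speech to a file');

// Pipe the audio into a file; pipeline() handles backpressure and cleanup.
await pipeline(audio, createWriteStream('speech.mp3'));
```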
Binary file
package/dist/_tsup-dts-rollup.d.ts ADDED
@@ -0,0 +1,50 @@
+ import { MastraVoice } from '@mastra/core/voice';
+
+ /**
+  * List of available Deepgram models for text-to-speech and speech-to-text
+  */
+ export declare const DEEPGRAM_MODELS: readonly ["aura", "whisper", "base", "enhanced", "nova", "nova-2", "nova-3"];
+
+ /**
+  * List of available Deepgram voice models for text-to-speech
+  * Each voice is designed for specific use cases and languages
+  * Format: {name}-{language} (e.g. asteria-en)
+  */
+ export declare const DEEPGRAM_VOICES: readonly ["asteria-en", "luna-en", "stella-en", "athena-en", "hera-en", "orion-en", "arcas-en", "perseus-en", "angus-en", "orpheus-en", "helios-en", "zeus-en"];
+
+ declare type DeepgramModel = (typeof DEEPGRAM_MODELS)[number];
+ export { DeepgramModel }
+ export { DeepgramModel as DeepgramModel_alias_1 }
+
+ export declare class DeepgramVoice extends MastraVoice {
+     private speechClient?;
+     private listeningClient?;
+     constructor({ speechModel, listeningModel, speaker, }?: {
+         speechModel?: DeepgramVoiceConfig;
+         listeningModel?: DeepgramVoiceConfig;
+         speaker?: DeepgramVoiceId;
+     });
+     getSpeakers(): Promise<{
+         voiceId: "asteria-en" | "luna-en" | "stella-en" | "athena-en" | "hera-en" | "orion-en" | "arcas-en" | "perseus-en" | "angus-en" | "orpheus-en" | "helios-en" | "zeus-en";
+     }[]>;
+     speak(input: string | NodeJS.ReadableStream, options?: {
+         speaker?: string;
+         [key: string]: any;
+     }): Promise<NodeJS.ReadableStream>;
+     listen(audioStream: NodeJS.ReadableStream, options?: {
+         [key: string]: any;
+     }): Promise<string>;
+ }
+
+ export declare interface DeepgramVoiceConfig {
+     name?: DeepgramModel;
+     apiKey?: string;
+     properties?: Record<string, any>;
+     language?: string;
+ }
+
+ declare type DeepgramVoiceId = (typeof DEEPGRAM_VOICES)[number];
+ export { DeepgramVoiceId }
+ export { DeepgramVoiceId as DeepgramVoiceId_alias_1 }
+
+ export { }
package/dist/index.d.ts ADDED
@@ -0,0 +1,4 @@
+ export { DeepgramVoice } from './_tsup-dts-rollup.js';
+ export { DeepgramVoiceConfig } from './_tsup-dts-rollup.js';
+ export { DeepgramVoiceId } from './_tsup-dts-rollup.js';
+ export { DeepgramModel } from './_tsup-dts-rollup.js';
package/dist/index.js ADDED
@@ -0,0 +1,163 @@
+ import { createClient } from '@deepgram/sdk';
+ import { MastraVoice } from '@mastra/core/voice';
+ import { PassThrough } from 'stream';
+
+ // src/index.ts
+
+ // src/voices.ts
+ var DEEPGRAM_VOICES = [
+   "asteria-en",
+   "luna-en",
+   "stella-en",
+   "athena-en",
+   "hera-en",
+   "orion-en",
+   "arcas-en",
+   "perseus-en",
+   "angus-en",
+   "orpheus-en",
+   "helios-en",
+   "zeus-en"
+ ];
+
+ // src/index.ts
+ var DeepgramVoice = class extends MastraVoice {
+   speechClient;
+   listeningClient;
+   constructor({
+     speechModel,
+     listeningModel,
+     speaker
+   } = {}) {
+     const defaultApiKey = process.env.DEEPGRAM_API_KEY;
+     const defaultSpeechModel = {
+       name: "aura",
+       apiKey: defaultApiKey
+     };
+     const defaultListeningModel = {
+       name: "nova",
+       apiKey: defaultApiKey
+     };
+     super({
+       speechModel: {
+         name: speechModel?.name ?? defaultSpeechModel.name,
+         apiKey: speechModel?.apiKey ?? defaultSpeechModel.apiKey
+       },
+       listeningModel: {
+         name: listeningModel?.name ?? defaultListeningModel.name,
+         apiKey: listeningModel?.apiKey ?? defaultListeningModel.apiKey
+       },
+       speaker
+     });
+     const speechApiKey = speechModel?.apiKey || defaultApiKey;
+     const listeningApiKey = listeningModel?.apiKey || defaultApiKey;
+     console.log("speechApiKey", speechApiKey);
+     console.log("listeningApiKey", listeningApiKey);
+     if (!speechApiKey && !listeningApiKey) {
+       throw new Error("At least one of DEEPGRAM_API_KEY, speechModel.apiKey, or listeningModel.apiKey must be set");
+     }
+     if (speechApiKey) {
+       this.speechClient = createClient(speechApiKey);
+     }
+     if (listeningApiKey) {
+       this.listeningClient = createClient(listeningApiKey);
+     }
+     this.speaker = speaker || "asteria-en";
+   }
+   async getSpeakers() {
+     return this.traced(async () => {
+       return DEEPGRAM_VOICES.map((voice) => ({
+         voiceId: voice
+       }));
+     }, "voice.deepgram.getSpeakers")();
+   }
+   async speak(input, options) {
+     if (!this.speechClient) {
+       throw new Error("Deepgram speech client not configured");
+     }
+     let text;
+     if (typeof input !== "string") {
+       const chunks = [];
+       for await (const chunk of input) {
+         chunks.push(Buffer.from(chunk));
+       }
+       text = Buffer.concat(chunks).toString("utf-8");
+     } else {
+       text = input;
+     }
+     if (text.trim().length === 0) {
+       throw new Error("Input text is empty");
+     }
+     return this.traced(async () => {
+       if (!this.speechClient) {
+         throw new Error("No speech client configured");
+       }
+       let model;
+       if (options?.speaker) {
+         model = this.speechModel?.name + "-" + options.speaker;
+       } else if (this.speaker) {
+         model = this.speechModel?.name + "-" + this.speaker;
+       }
+       const speakClient = this.speechClient.speak;
+       const response = await speakClient.request(
+         { text },
+         {
+           model,
+           ...options
+         }
+       );
+       const webStream = await response.getStream();
+       if (!webStream) {
+         throw new Error("No stream returned from Deepgram");
+       }
+       const reader = webStream.getReader();
+       const nodeStream = new PassThrough();
+       (async () => {
+         try {
+           while (true) {
+             const { done, value } = await reader.read();
+             if (done) {
+               nodeStream.end();
+               break;
+             }
+             nodeStream.write(value);
+           }
+         } catch (error) {
+           nodeStream.destroy(error);
+         }
+       })().catch((error) => {
+         nodeStream.destroy(error);
+       });
+       return nodeStream;
+     }, "voice.deepgram.speak")();
+   }
+   async listen(audioStream, options) {
+     if (!this.listeningClient) {
+       throw new Error("Deepgram listening client not configured");
+     }
+     const chunks = [];
+     for await (const chunk of audioStream) {
+       chunks.push(Buffer.from(chunk));
+     }
+     const buffer = Buffer.concat(chunks);
+     return this.traced(async () => {
+       if (!this.listeningClient) {
+         throw new Error("No listening client configured");
+       }
+       const { result, error } = await this.listeningClient.listen.prerecorded.transcribeFile(buffer, {
+         model: this.listeningModel?.name,
+         ...options
+       });
+       if (error) {
+         throw error;
+       }
+       const transcript = result.results?.channels?.[0]?.alternatives?.[0]?.transcript;
+       if (!transcript) {
+         throw new Error("No transcript found in Deepgram response");
+       }
+       return transcript;
+     }, "voice.deepgram.listen")();
+   }
+ };
+
+ export { DeepgramVoice };
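A note on the stream bridging in `speak()` above: the bundle pumps Deepgram's Web `ReadableStream` into a Node `PassThrough` by hand. On Node 17+, `Readable.fromWeb` performs the same Web-to-Node conversion in one call; a minimal sketch of that standard-library alternative (not what this package ships, just an equivalent):

```typescript
import { Readable } from 'stream';
import type { ReadableStream } from 'stream/web';

// Wraps a Web ReadableStream (such as the one returned by response.getStream())
// as a Node readable stream, with backpressure handled by Node itself.
function webToNodeStream(webStream: ReadableStream): NodeJS.ReadableStream {
  return Readable.fromWeb(webStream);
}
```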
package/eslint.config.js ADDED
@@ -0,0 +1,6 @@
+ import { createConfig } from '@internal/lint/eslint';
+
+ const config = await createConfig();
+
+ /** @type {import("eslint").Linter.Config[]} */
+ export default [...config];
package/package.json ADDED
@@ -0,0 +1,37 @@
+ {
+   "name": "@mastra/voice-deepgram",
+   "version": "0.1.0-alpha.2",
+   "description": "Mastra Deepgram voice integration",
+   "type": "module",
+   "main": "dist/index.js",
+   "types": "dist/index.d.ts",
+   "exports": {
+     ".": {
+       "import": {
+         "types": "./dist/index.d.ts",
+         "default": "./dist/index.js"
+       }
+     },
+     "./package.json": "./package.json"
+   },
+   "dependencies": {
+     "@deepgram/sdk": "^3.9.0",
+     "zod": "^3.24.1",
+     "@mastra/core": "^0.4.2-alpha.0"
+   },
+   "devDependencies": {
+     "@microsoft/api-extractor": "^7.49.2",
+     "@types/node": "^22.13.1",
+     "tsup": "^8.3.6",
+     "typescript": "^5.7.3",
+     "vitest": "^2.1.8",
+     "eslint": "^9.20.1",
+     "@internal/lint": "0.0.0"
+   },
+   "scripts": {
+     "build": "tsup src/index.ts --format esm --experimental-dts --clean --treeshake",
+     "build:watch": "pnpm build --watch",
+     "test": "vitest run",
+     "lint": "eslint ."
+   }
+ }
package/src/index.test.ts ADDED
@@ -0,0 +1,134 @@
+ import { writeFileSync, mkdirSync, createReadStream } from 'fs';
+ import path from 'path';
+ import { PassThrough } from 'stream';
+ import { describe, expect, it, beforeAll } from 'vitest';
+
+ import { DeepgramVoice } from './index.js';
+
+ describe('DeepgramVoice Integration Tests', () => {
+   let voice: DeepgramVoice;
+   const outputDir = path.join(process.cwd(), 'test-outputs');
+
+   beforeAll(() => {
+     try {
+       mkdirSync(outputDir, { recursive: true });
+     } catch (err) {
+       console.log('Directory already exists: ', err);
+     }
+
+     voice = new DeepgramVoice({
+       speechModel: {
+         name: 'aura',
+       },
+       listeningModel: {
+         name: 'whisper',
+       },
+       speaker: 'asteria-en',
+     });
+   });
+
+   describe('getSpeakers', () => {
+     it('should list available voices', async () => {
+       const speakers = await voice.getSpeakers();
+       const expectedVoiceIds = ['asteria-en', 'stella-en', 'luna-en'];
+       expectedVoiceIds.forEach(voiceId => {
+         expect(speakers.some(s => s.voiceId === voiceId)).toBe(true);
+       });
+     });
+   });
+
+   describe('speak', () => {
+     it('should generate audio and save to file', async () => {
+       const audioResult = await voice.speak('Hello World', {
+         text: 'Hello World',
+       });
+
+       const chunks: Buffer[] = [];
+       for await (const chunk of audioResult) {
+         chunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(chunk));
+       }
+       const audioBuffer = Buffer.concat(chunks);
+       const outputPath = path.join(outputDir, 'deepgram-speech-test.mp3');
+       writeFileSync(outputPath, audioBuffer);
+       expect(audioBuffer.length).toBeGreaterThan(0);
+     }, 10000);
+
+     it('should work with different parameters', async () => {
+       const audioResult = await voice.speak('Hello World', {
+         text: 'Test with parameters',
+         speaker: 'luna-en',
+       });
+
+       const chunks: Buffer[] = [];
+       for await (const chunk of audioResult) {
+         chunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(chunk));
+       }
+       const audioBuffer = Buffer.concat(chunks);
+       const outputPath = path.join(outputDir, 'deepgram-speech-test-params.mp3');
+       writeFileSync(outputPath, audioBuffer);
+       expect(audioBuffer.length).toBeGreaterThan(0);
+     }, 10000);
+   });
+
+   // Error cases
+   describe('error handling', () => {
+     it('should handle invalid voice names', async () => {
+       await expect(voice.speak('Test', { speaker: 'invalid_voice' })).rejects.toThrow();
+     });
+
+     it('should handle empty text', async () => {
+       await expect(voice.speak('', { speaker: 'asteria-en' })).rejects.toThrow('Input text is empty');
+     });
+
+     it('should handle whitespace-only text', async () => {
+       await expect(voice.speak(' \n\t ', { speaker: 'asteria-en' })).rejects.toThrow('Input text is empty');
+     });
+   });
+
+   describe('listen', () => {
+     it('should transcribe audio buffer', async () => {
+       // First generate some audio to transcribe
+       const audioResult = await voice.speak('This is a test of transcription');
+
+       // Collect audio chunks
+       const chunks: Buffer[] = [];
+       for await (const chunk of audioResult) {
+         chunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(chunk));
+       }
+       const audioBuffer = Buffer.concat(chunks);
+
+       // Create stream from the buffer
+       const stream = new PassThrough();
+       stream.end(audioBuffer);
+       const result = await voice.listen(stream);
+
+       expect(typeof result).toBe('string');
+       expect(result.toLowerCase()).toContain('test');
+       expect(result.toLowerCase()).toContain('transcription');
+     }, 15000);
+
+     it('should transcribe audio from fixture file', async () => {
+       const fixturePath = path.join(process.cwd(), '__fixtures__', 'voice-test.m4a');
+       const audioStream = createReadStream(fixturePath);
+
+       console.log('listening to audio stream');
+       const text = await voice.listen(audioStream, {
+         filetype: 'm4a',
+       });
+       console.log('text', text);
+
+       expect(text).toBeTruthy();
+       console.log(text);
+       expect(typeof text).toBe('string');
+       expect(text.length).toBeGreaterThan(0);
+     }, 15000);
+
+     it('should handle invalid audio', async () => {
+       const invalidAudio = Buffer.from('not valid audio');
+       const stream = new PassThrough();
+       stream.end(invalidAudio);
+
+       await expect(voice.listen(stream)).rejects.toThrow();
+     });
+   });
+ });
package/src/index.ts ADDED
@@ -0,0 +1,190 @@
+ import { createClient } from '@deepgram/sdk';
+ import { MastraVoice } from '@mastra/core/voice';
+ import { PassThrough } from 'stream';
+
+ import { DEEPGRAM_VOICES } from './voices';
+ import type { DeepgramVoiceId, DeepgramModel } from './voices';
+
+ interface DeepgramVoiceConfig {
+   name?: DeepgramModel;
+   apiKey?: string;
+   properties?: Record<string, any>;
+   language?: string;
+ }
+
+ export class DeepgramVoice extends MastraVoice {
+   private speechClient?: ReturnType<typeof createClient>;
+   private listeningClient?: ReturnType<typeof createClient>;
+
+   constructor({
+     speechModel,
+     listeningModel,
+     speaker,
+   }: { speechModel?: DeepgramVoiceConfig; listeningModel?: DeepgramVoiceConfig; speaker?: DeepgramVoiceId } = {}) {
+     const defaultApiKey = process.env.DEEPGRAM_API_KEY;
+
+     const defaultSpeechModel = {
+       name: 'aura',
+       apiKey: defaultApiKey,
+     };
+
+     const defaultListeningModel = {
+       name: 'nova',
+       apiKey: defaultApiKey,
+     };
+
+     super({
+       speechModel: {
+         name: speechModel?.name ?? defaultSpeechModel.name,
+         apiKey: speechModel?.apiKey ?? defaultSpeechModel.apiKey,
+       },
+       listeningModel: {
+         name: listeningModel?.name ?? defaultListeningModel.name,
+         apiKey: listeningModel?.apiKey ?? defaultListeningModel.apiKey,
+       },
+       speaker,
+     });
+
+     const speechApiKey = speechModel?.apiKey || defaultApiKey;
+     const listeningApiKey = listeningModel?.apiKey || defaultApiKey;
+     console.log('speechApiKey', speechApiKey);
+     console.log('listeningApiKey', listeningApiKey);
+     if (!speechApiKey && !listeningApiKey) {
+       throw new Error('At least one of DEEPGRAM_API_KEY, speechModel.apiKey, or listeningModel.apiKey must be set');
+     }
+
+     if (speechApiKey) {
+       this.speechClient = createClient(speechApiKey);
+     }
+     if (listeningApiKey) {
+       this.listeningClient = createClient(listeningApiKey);
+     }
+
+     this.speaker = speaker || 'asteria-en';
+   }
+
+   async getSpeakers() {
+     return this.traced(async () => {
+       return DEEPGRAM_VOICES.map(voice => ({
+         voiceId: voice,
+       }));
+     }, 'voice.deepgram.getSpeakers')();
+   }
+
+   async speak(
+     input: string | NodeJS.ReadableStream,
+     options?: {
+       speaker?: string;
+       [key: string]: any;
+     },
+   ): Promise<NodeJS.ReadableStream> {
+     if (!this.speechClient) {
+       throw new Error('Deepgram speech client not configured');
+     }
+
+     let text: string;
+     if (typeof input !== 'string') {
+       const chunks: Buffer[] = [];
+       for await (const chunk of input) {
+         chunks.push(Buffer.from(chunk));
+       }
+       text = Buffer.concat(chunks).toString('utf-8');
+     } else {
+       text = input;
+     }
+
+     if (text.trim().length === 0) {
+       throw new Error('Input text is empty');
+     }
+
+     return this.traced(async () => {
+       if (!this.speechClient) {
+         throw new Error('No speech client configured');
+       }
+
+       let model;
+       if (options?.speaker) {
+         model = this.speechModel?.name + '-' + options.speaker;
+       } else if (this.speaker) {
+         model = this.speechModel?.name + '-' + this.speaker;
+       }
+
+       const speakClient = this.speechClient.speak;
+       const response = await speakClient.request(
+         { text },
+         {
+           model,
+           ...options,
+         },
+       );
+
+       const webStream = await response.getStream();
+       if (!webStream) {
+         throw new Error('No stream returned from Deepgram');
+       }
+
+       const reader = webStream.getReader();
+       const nodeStream = new PassThrough();
+
+       // Add error handling for the stream processing
+       (async () => {
+         try {
+           while (true) {
+             const { done, value } = await reader.read();
+             if (done) {
+               nodeStream.end();
+               break;
+             }
+             nodeStream.write(value);
+           }
+         } catch (error) {
+           nodeStream.destroy(error as Error);
+         }
+       })().catch(error => {
+         nodeStream.destroy(error as Error);
+       });
+
+       return nodeStream;
+     }, 'voice.deepgram.speak')();
+   }
+
+   async listen(
+     audioStream: NodeJS.ReadableStream,
+     options?: {
+       [key: string]: any;
+     },
+   ): Promise<string> {
+     if (!this.listeningClient) {
+       throw new Error('Deepgram listening client not configured');
+     }
+
+     const chunks: Buffer[] = [];
+     for await (const chunk of audioStream) {
+       chunks.push(Buffer.from(chunk));
+     }
+     const buffer = Buffer.concat(chunks);
+
+     return this.traced(async () => {
+       if (!this.listeningClient) {
+         throw new Error('No listening client configured');
+       }
+       const { result, error } = await this.listeningClient.listen.prerecorded.transcribeFile(buffer, {
+         model: this.listeningModel?.name,
+         ...options,
+       });
+
+       if (error) {
+         throw error;
+       }
+
+       const transcript = result.results?.channels?.[0]?.alternatives?.[0]?.transcript;
+       if (!transcript) {
+         throw new Error('No transcript found in Deepgram response');
+       }
+
+       return transcript;
+     }, 'voice.deepgram.listen')();
+   }
+ }
+
+ export type { DeepgramVoiceConfig, DeepgramVoiceId, DeepgramModel };
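One detail worth calling out in `speak()` above: the model string sent to Deepgram is assembled by joining the speech model name and the speaker id with a hyphen, which is why the configuration is split across two fields. A small sketch of that composition in isolation:

```typescript
// Mirrors the composition in speak(): `${speechModel.name}-${speaker}`.
// 'aura' (model family) + 'asteria-en' (speaker id) yields 'aura-asteria-en',
// the full TTS model name Deepgram expects.
const speechModelName = 'aura';
const speaker = 'asteria-en';
const model = `${speechModelName}-${speaker}`;
console.log(model); // "aura-asteria-en"
```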
package/src/voices.ts ADDED
@@ -0,0 +1,28 @@
+ /**
+  * List of available Deepgram voice models for text-to-speech
+  * Each voice is designed for specific use cases and languages
+  * Format: {name}-{language} (e.g. asteria-en)
+  */
+ export const DEEPGRAM_VOICES = [
+   'asteria-en',
+   'luna-en',
+   'stella-en',
+   'athena-en',
+   'hera-en',
+   'orion-en',
+   'arcas-en',
+   'perseus-en',
+   'angus-en',
+   'orpheus-en',
+   'helios-en',
+   'zeus-en',
+ ] as const;
+
+ export type DeepgramVoiceId = (typeof DEEPGRAM_VOICES)[number];
+
+ /**
+  * List of available Deepgram models for text-to-speech and speech-to-text
+  */
+ export const DEEPGRAM_MODELS = ['aura', 'whisper', 'base', 'enhanced', 'nova', 'nova-2', 'nova-3'] as const;
+
+ export type DeepgramModel = (typeof DEEPGRAM_MODELS)[number];
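Because `DEEPGRAM_VOICES` is a readonly tuple, it can double as a runtime validator. A minimal sketch of a type guard built on it (the helper name is hypothetical, not part of this package):

```typescript
import { DEEPGRAM_VOICES } from './voices';
import type { DeepgramVoiceId } from './voices';

// Hypothetical helper: narrows an arbitrary string (e.g. user input)
// to the DeepgramVoiceId union before using it as a speaker.
function isDeepgramVoiceId(value: string): value is DeepgramVoiceId {
  return (DEEPGRAM_VOICES as readonly string[]).includes(value);
}
```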
package/tsconfig.json ADDED
@@ -0,0 +1,5 @@
+ {
+   "extends": "../../tsconfig.node.json",
+   "include": ["src/**/*"],
+   "exclude": ["node_modules", "**/*.test.ts"]
+ }
package/vitest.config.ts ADDED
@@ -0,0 +1,9 @@
+ import { defineConfig } from 'vitest/config';
+
+ export default defineConfig({
+   test: {
+     globals: true,
+     environment: 'node',
+     include: ['src/**/*.test.ts'],
+   },
+ });