@mastra/mcp-docs-server 1.1.7-alpha.0 → 1.1.8-alpha.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.docs/docs/agents/agent-approval.md +61 -31
- package/.docs/docs/agents/supervisor-agents.md +1 -1
- package/.docs/docs/getting-started/manual-install.md +1 -1
- package/.docs/docs/index.md +68 -24
- package/.docs/docs/mastra-cloud/setup.md +1 -1
- package/.docs/docs/memory/observational-memory.md +9 -0
- package/.docs/docs/memory/semantic-recall.md +17 -1
- package/.docs/docs/workspace/skills.md +7 -5
- package/.docs/guides/deployment/aws-lambda.md +76 -165
- package/.docs/guides/deployment/azure-app-services.md +38 -61
- package/.docs/guides/deployment/cloudflare.md +1 -1
- package/.docs/guides/deployment/netlify.md +1 -1
- package/.docs/guides/deployment/vercel.md +1 -1
- package/.docs/models/gateways/netlify.md +5 -1
- package/.docs/models/index.md +1 -1
- package/.docs/models/providers/anthropic.md +9 -9
- package/.docs/models/providers/deepseek.md +1 -1
- package/.docs/models/providers/google.md +11 -11
- package/.docs/models/providers/openai.md +19 -19
- package/.docs/models/providers/opencode.md +33 -33
- package/.docs/models/providers/xai.md +3 -3
- package/.docs/reference/agents/agent.md +20 -20
- package/.docs/reference/agents/generate.md +200 -66
- package/.docs/reference/agents/generateLegacy.md +77 -35
- package/.docs/reference/agents/getDefaultGenerateOptions.md +4 -6
- package/.docs/reference/agents/getDefaultOptions.md +4 -6
- package/.docs/reference/agents/getDefaultStreamOptions.md +4 -6
- package/.docs/reference/agents/getDescription.md +1 -1
- package/.docs/reference/agents/getInstructions.md +4 -6
- package/.docs/reference/agents/getLLM.md +6 -8
- package/.docs/reference/agents/getMemory.md +4 -6
- package/.docs/reference/agents/getModel.md +4 -6
- package/.docs/reference/agents/getTools.md +5 -7
- package/.docs/reference/agents/getVoice.md +4 -6
- package/.docs/reference/agents/listAgents.md +4 -6
- package/.docs/reference/agents/listScorers.md +4 -6
- package/.docs/reference/agents/listTools.md +4 -6
- package/.docs/reference/agents/listWorkflows.md +4 -6
- package/.docs/reference/agents/network.md +69 -23
- package/.docs/reference/ai-sdk/chat-route.md +7 -7
- package/.docs/reference/ai-sdk/handle-chat-stream.md +12 -12
- package/.docs/reference/ai-sdk/handle-network-stream.md +4 -4
- package/.docs/reference/ai-sdk/handle-workflow-stream.md +11 -11
- package/.docs/reference/ai-sdk/network-route.md +3 -3
- package/.docs/reference/ai-sdk/to-ai-sdk-stream.md +9 -9
- package/.docs/reference/ai-sdk/to-ai-sdk-v4-messages.md +9 -9
- package/.docs/reference/ai-sdk/to-ai-sdk-v5-messages.md +5 -5
- package/.docs/reference/ai-sdk/with-mastra.md +12 -12
- package/.docs/reference/ai-sdk/workflow-route.md +3 -3
- package/.docs/reference/auth/auth0.md +6 -6
- package/.docs/reference/auth/better-auth.md +5 -5
- package/.docs/reference/auth/clerk.md +5 -5
- package/.docs/reference/auth/firebase.md +7 -7
- package/.docs/reference/auth/jwt.md +1 -1
- package/.docs/reference/auth/supabase.md +4 -4
- package/.docs/reference/auth/workos.md +6 -6
- package/.docs/reference/cli/create-mastra.md +14 -14
- package/.docs/reference/client-js/mastra-client.md +23 -23
- package/.docs/reference/client-js/workflows.md +3 -3
- package/.docs/reference/core/addGateway.md +2 -2
- package/.docs/reference/core/getAgent.md +2 -2
- package/.docs/reference/core/getAgentById.md +2 -2
- package/.docs/reference/core/getDeployer.md +1 -1
- package/.docs/reference/core/getGateway.md +2 -2
- package/.docs/reference/core/getGatewayById.md +2 -2
- package/.docs/reference/core/getLogger.md +1 -1
- package/.docs/reference/core/getMCPServer.md +2 -2
- package/.docs/reference/core/getMCPServerById.md +3 -3
- package/.docs/reference/core/getMemory.md +2 -2
- package/.docs/reference/core/getScorer.md +2 -2
- package/.docs/reference/core/getScorerById.md +2 -2
- package/.docs/reference/core/getServer.md +1 -1
- package/.docs/reference/core/getStorage.md +1 -1
- package/.docs/reference/core/getStoredAgentById.md +18 -20
- package/.docs/reference/core/getTelemetry.md +1 -1
- package/.docs/reference/core/getVector.md +2 -2
- package/.docs/reference/core/getWorkflow.md +3 -3
- package/.docs/reference/core/listAgents.md +1 -1
- package/.docs/reference/core/listGateways.md +1 -1
- package/.docs/reference/core/listLogs.md +9 -11
- package/.docs/reference/core/listLogsByRunId.md +9 -9
- package/.docs/reference/core/listMCPServers.md +1 -1
- package/.docs/reference/core/listMemory.md +1 -1
- package/.docs/reference/core/listScorers.md +1 -1
- package/.docs/reference/core/listStoredAgents.md +9 -11
- package/.docs/reference/core/listVectors.md +1 -1
- package/.docs/reference/core/listWorkflows.md +2 -2
- package/.docs/reference/core/mastra-class.md +17 -17
- package/.docs/reference/core/mastra-model-gateway.md +15 -15
- package/.docs/reference/core/setLogger.md +2 -4
- package/.docs/reference/core/setStorage.md +1 -1
- package/.docs/reference/datasets/addItem.md +20 -4
- package/.docs/reference/datasets/addItems.md +8 -2
- package/.docs/reference/datasets/compareExperiments.md +15 -3
- package/.docs/reference/datasets/create.md +6 -6
- package/.docs/reference/datasets/dataset.md +1 -1
- package/.docs/reference/datasets/delete.md +2 -2
- package/.docs/reference/datasets/deleteExperiment.md +2 -2
- package/.docs/reference/datasets/deleteItem.md +2 -2
- package/.docs/reference/datasets/deleteItems.md +2 -2
- package/.docs/reference/datasets/get.md +2 -2
- package/.docs/reference/datasets/getDetails.md +9 -9
- package/.docs/reference/datasets/getExperiment.md +2 -2
- package/.docs/reference/datasets/getItem.md +3 -3
- package/.docs/reference/datasets/getItemHistory.md +22 -2
- package/.docs/reference/datasets/list.md +7 -3
- package/.docs/reference/datasets/listExperimentResults.md +34 -4
- package/.docs/reference/datasets/listExperiments.md +41 -3
- package/.docs/reference/datasets/listItems.md +18 -6
- package/.docs/reference/datasets/listVersions.md +23 -3
- package/.docs/reference/datasets/startExperiment.md +62 -12
- package/.docs/reference/datasets/startExperimentAsync.md +5 -1
- package/.docs/reference/datasets/update.md +6 -6
- package/.docs/reference/datasets/updateItem.md +5 -5
- package/.docs/reference/deployer.md +8 -8
- package/.docs/reference/evals/answer-relevancy.md +11 -11
- package/.docs/reference/evals/answer-similarity.md +17 -19
- package/.docs/reference/evals/bias.md +10 -10
- package/.docs/reference/evals/completeness.md +3 -3
- package/.docs/reference/evals/content-similarity.md +6 -6
- package/.docs/reference/evals/context-precision.md +4 -4
- package/.docs/reference/evals/context-relevance.md +4 -4
- package/.docs/reference/evals/create-scorer.md +47 -49
- package/.docs/reference/evals/faithfulness.md +11 -11
- package/.docs/reference/evals/hallucination.md +17 -21
- package/.docs/reference/evals/keyword-coverage.md +4 -4
- package/.docs/reference/evals/mastra-scorer.md +14 -14
- package/.docs/reference/evals/noise-sensitivity.md +4 -4
- package/.docs/reference/evals/prompt-alignment.md +4 -4
- package/.docs/reference/evals/run-evals.md +16 -16
- package/.docs/reference/evals/scorer-utils.md +3 -3
- package/.docs/reference/evals/textual-difference.md +3 -3
- package/.docs/reference/evals/tone-consistency.md +3 -3
- package/.docs/reference/evals/tool-call-accuracy.md +5 -5
- package/.docs/reference/evals/toxicity.md +8 -8
- package/.docs/reference/harness/harness-class.md +34 -42
- package/.docs/reference/logging/pino-logger.md +5 -5
- package/.docs/reference/memory/clone-utilities.md +5 -5
- package/.docs/reference/memory/cloneThread.md +17 -21
- package/.docs/reference/memory/createThread.md +10 -10
- package/.docs/reference/memory/deleteMessages.md +2 -2
- package/.docs/reference/memory/getThreadById.md +2 -2
- package/.docs/reference/memory/listThreads.md +5 -5
- package/.docs/reference/memory/memory-class.md +12 -14
- package/.docs/reference/memory/observational-memory.md +102 -94
- package/.docs/reference/memory/recall.md +14 -16
- package/.docs/reference/observability/tracing/configuration.md +27 -10
- package/.docs/reference/observability/tracing/exporters/console-exporter.md +4 -7
- package/.docs/reference/processors/batch-parts-processor.md +8 -10
- package/.docs/reference/processors/language-detector.md +14 -16
- package/.docs/reference/processors/message-history-processor.md +7 -9
- package/.docs/reference/processors/moderation-processor.md +13 -15
- package/.docs/reference/processors/pii-detector.md +14 -16
- package/.docs/reference/processors/processor-interface.md +62 -62
- package/.docs/reference/processors/prompt-injection-detector.md +11 -13
- package/.docs/reference/processors/semantic-recall-processor.md +14 -16
- package/.docs/reference/processors/system-prompt-scrubber.md +12 -14
- package/.docs/reference/processors/token-limiter-processor.md +11 -13
- package/.docs/reference/processors/tool-call-filter.md +5 -7
- package/.docs/reference/processors/tool-search-processor.md +9 -11
- package/.docs/reference/processors/unicode-normalizer.md +8 -10
- package/.docs/reference/processors/working-memory-processor.md +14 -18
- package/.docs/reference/rag/chunk.md +38 -38
- package/.docs/reference/rag/database-config.md +11 -7
- package/.docs/reference/rag/document.md +2 -2
- package/.docs/reference/rag/embeddings.md +12 -12
- package/.docs/reference/rag/extract-params.md +23 -23
- package/.docs/reference/rag/graph-rag.md +12 -12
- package/.docs/reference/rag/rerank.md +25 -17
- package/.docs/reference/rag/rerankWithScorer.md +25 -17
- package/.docs/reference/server/create-route.md +14 -14
- package/.docs/reference/server/express-adapter.md +10 -10
- package/.docs/reference/server/fastify-adapter.md +10 -10
- package/.docs/reference/server/hono-adapter.md +10 -10
- package/.docs/reference/server/koa-adapter.md +10 -10
- package/.docs/reference/server/mastra-server.md +10 -10
- package/.docs/reference/server/register-api-route.md +13 -13
- package/.docs/reference/storage/cloudflare-d1.md +5 -5
- package/.docs/reference/storage/cloudflare.md +6 -6
- package/.docs/reference/storage/composite.md +9 -9
- package/.docs/reference/storage/convex.md +3 -3
- package/.docs/reference/storage/dynamodb.md +9 -9
- package/.docs/reference/storage/lance.md +3 -3
- package/.docs/reference/storage/libsql.md +2 -2
- package/.docs/reference/storage/mongodb.md +5 -5
- package/.docs/reference/storage/mssql.md +2 -2
- package/.docs/reference/storage/postgresql.md +25 -25
- package/.docs/reference/storage/upstash.md +3 -3
- package/.docs/reference/streaming/ChunkType.md +251 -59
- package/.docs/reference/streaming/agents/MastraModelOutput.md +86 -16
- package/.docs/reference/streaming/agents/stream.md +155 -43
- package/.docs/reference/streaming/agents/streamLegacy.md +79 -39
- package/.docs/reference/streaming/workflows/resumeStream.md +18 -8
- package/.docs/reference/streaming/workflows/stream.md +21 -9
- package/.docs/reference/streaming/workflows/timeTravelStream.md +4 -4
- package/.docs/reference/tools/create-tool.md +25 -21
- package/.docs/reference/tools/document-chunker-tool.md +7 -7
- package/.docs/reference/tools/graph-rag-tool.md +16 -18
- package/.docs/reference/tools/mcp-client.md +38 -27
- package/.docs/reference/tools/mcp-server.md +45 -45
- package/.docs/reference/tools/vector-query-tool.md +34 -22
- package/.docs/reference/vectors/astra.md +22 -22
- package/.docs/reference/vectors/chroma.md +44 -44
- package/.docs/reference/vectors/convex.md +26 -26
- package/.docs/reference/vectors/couchbase.md +30 -30
- package/.docs/reference/vectors/duckdb.md +29 -29
- package/.docs/reference/vectors/elasticsearch.md +27 -27
- package/.docs/reference/vectors/lance.md +46 -38
- package/.docs/reference/vectors/libsql.md +31 -31
- package/.docs/reference/vectors/mongodb.md +32 -32
- package/.docs/reference/vectors/opensearch.md +27 -27
- package/.docs/reference/vectors/pg.md +60 -44
- package/.docs/reference/vectors/pinecone.md +38 -38
- package/.docs/reference/vectors/qdrant.md +36 -36
- package/.docs/reference/vectors/s3vectors.md +24 -24
- package/.docs/reference/vectors/turbopuffer.md +29 -29
- package/.docs/reference/vectors/upstash.md +25 -25
- package/.docs/reference/vectors/vectorize.md +27 -27
- package/.docs/reference/voice/azure.md +19 -15
- package/.docs/reference/voice/cloudflare.md +10 -12
- package/.docs/reference/voice/composite-voice.md +10 -10
- package/.docs/reference/voice/deepgram.md +20 -14
- package/.docs/reference/voice/elevenlabs.md +20 -22
- package/.docs/reference/voice/google-gemini-live.md +42 -44
- package/.docs/reference/voice/google.md +25 -21
- package/.docs/reference/voice/mastra-voice.md +20 -20
- package/.docs/reference/voice/murf.md +24 -28
- package/.docs/reference/voice/openai-realtime.md +26 -26
- package/.docs/reference/voice/openai.md +14 -12
- package/.docs/reference/voice/playai.md +13 -15
- package/.docs/reference/voice/sarvam.md +21 -25
- package/.docs/reference/voice/speechify.md +11 -13
- package/.docs/reference/voice/voice.addInstructions.md +1 -1
- package/.docs/reference/voice/voice.addTools.md +1 -1
- package/.docs/reference/voice/voice.answer.md +1 -1
- package/.docs/reference/voice/voice.connect.md +3 -3
- package/.docs/reference/voice/voice.events.md +11 -11
- package/.docs/reference/voice/voice.getSpeakers.md +30 -30
- package/.docs/reference/voice/voice.listen.md +9 -9
- package/.docs/reference/voice/voice.off.md +2 -2
- package/.docs/reference/voice/voice.on.md +2 -2
- package/.docs/reference/voice/voice.send.md +1 -1
- package/.docs/reference/voice/voice.speak.md +11 -11
- package/.docs/reference/voice/voice.updateConfig.md +3 -3
- package/.docs/reference/workflows/run-methods/cancel.md +2 -2
- package/.docs/reference/workflows/run-methods/restart.md +17 -5
- package/.docs/reference/workflows/run-methods/resume.md +23 -9
- package/.docs/reference/workflows/run-methods/start.md +22 -8
- package/.docs/reference/workflows/run-methods/startAsync.md +12 -6
- package/.docs/reference/workflows/run-methods/timeTravel.md +29 -13
- package/.docs/reference/workflows/run.md +12 -12
- package/.docs/reference/workflows/step.md +24 -26
- package/.docs/reference/workflows/workflow-methods/branch.md +2 -2
- package/.docs/reference/workflows/workflow-methods/commit.md +1 -1
- package/.docs/reference/workflows/workflow-methods/create-run.md +4 -4
- package/.docs/reference/workflows/workflow-methods/dountil.md +3 -3
- package/.docs/reference/workflows/workflow-methods/dowhile.md +3 -3
- package/.docs/reference/workflows/workflow-methods/foreach.md +9 -9
- package/.docs/reference/workflows/workflow-methods/map.md +2 -2
- package/.docs/reference/workflows/workflow-methods/parallel.md +2 -2
- package/.docs/reference/workflows/workflow-methods/sleep.md +2 -2
- package/.docs/reference/workflows/workflow-methods/sleepUntil.md +2 -2
- package/.docs/reference/workflows/workflow-methods/then.md +2 -2
- package/.docs/reference/workflows/workflow.md +40 -50
- package/.docs/reference/workspace/daytona-sandbox.md +33 -33
- package/.docs/reference/workspace/e2b-sandbox.md +20 -20
- package/.docs/reference/workspace/filesystem.md +22 -22
- package/.docs/reference/workspace/gcs-filesystem.md +15 -15
- package/.docs/reference/workspace/local-filesystem.md +35 -35
- package/.docs/reference/workspace/local-sandbox.md +26 -26
- package/.docs/reference/workspace/s3-filesystem.md +18 -18
- package/.docs/reference/workspace/sandbox.md +8 -8
- package/.docs/reference/workspace/workspace-class.md +30 -34
- package/CHANGELOG.md +16 -0
- package/package.json +6 -6
- package/.docs/docs/getting-started/start.md +0 -28
|
@@ -28,15 +28,13 @@ const speakers = await voice.getSpeakers()
|
|
|
28
28
|
|
|
29
29
|
## Constructor Parameters
|
|
30
30
|
|
|
31
|
-
**speechModel
|
|
31
|
+
**speechModel** (`ElevenLabsVoiceConfig`): Configuration for text-to-speech functionality. (Default: `{ name: 'eleven_multilingual_v2' }`)
|
|
32
32
|
|
|
33
|
-
**
|
|
33
|
+
**speechModel.name** (`ElevenLabsModel`): The ElevenLabs model to use
|
|
34
34
|
|
|
35
|
-
|
|
35
|
+
**speechModel.apiKey** (`string`): ElevenLabs API key. Falls back to ELEVENLABS\_API\_KEY environment variable
|
|
36
36
|
|
|
37
|
-
**
|
|
38
|
-
|
|
39
|
-
**apiKey?:** (`string`): ElevenLabs API key. Falls back to ELEVENLABS\_API\_KEY environment variable
|
|
37
|
+
**speaker** (`string`): ID of the speaker to use for text-to-speech (Default: `'9BWtsMINqrJLrRacOk9x' (Aria voice)`)
|
|
40
38
|
|
|
41
39
|
## Methods
|
|
42
40
|
|
|
@@ -44,11 +42,11 @@ const speakers = await voice.getSpeakers()
|
|
|
44
42
|
|
|
45
43
|
Converts text to speech using the configured speech model and voice.
|
|
46
44
|
|
|
47
|
-
**input
|
|
45
|
+
**input** (`string | NodeJS.ReadableStream`): Text to convert to speech. If a stream is provided, it will be converted to text first.
|
|
48
46
|
|
|
49
|
-
**options
|
|
47
|
+
**options** (`object`): Additional options for speech synthesis
|
|
50
48
|
|
|
51
|
-
**options.speaker
|
|
49
|
+
**options.speaker** (`string`): Override the default speaker ID for this request
|
|
52
50
|
|
|
53
51
|
Returns: `Promise<NodeJS.ReadableStream>`
|
|
54
52
|
|
|
@@ -56,37 +54,37 @@ Returns: `Promise<NodeJS.ReadableStream>`
|
|
|
56
54
|
|
|
57
55
|
Returns an array of available voice options, where each node contains:
|
|
58
56
|
|
|
59
|
-
**voiceId
|
|
57
|
+
**voiceId** (`string`): Unique identifier for the voice
|
|
60
58
|
|
|
61
|
-
**name
|
|
59
|
+
**name** (`string`): Display name of the voice
|
|
62
60
|
|
|
63
|
-
**language
|
|
61
|
+
**language** (`string`): Language code for the voice
|
|
64
62
|
|
|
65
|
-
**gender
|
|
63
|
+
**gender** (`string`): Gender of the voice
|
|
66
64
|
|
|
67
65
|
### listen()
|
|
68
66
|
|
|
69
67
|
Converts audio input to text using ElevenLabs Speech-to-Text API.
|
|
70
68
|
|
|
71
|
-
**input
|
|
69
|
+
**input** (`NodeJS.ReadableStream`): A readable stream containing the audio data to transcribe
|
|
72
70
|
|
|
73
|
-
**options
|
|
71
|
+
**options** (`object`): Configuration options for the transcription
|
|
74
72
|
|
|
75
73
|
The options object supports the following properties:
|
|
76
74
|
|
|
77
|
-
**language\_code
|
|
75
|
+
**language\_code** (`string`): ISO language code (e.g., 'en', 'fr', 'es')
|
|
78
76
|
|
|
79
|
-
**tag\_audio\_events
|
|
77
|
+
**tag\_audio\_events** (`boolean`): Whether to tag audio events like \[MUSIC], \[LAUGHTER], etc.
|
|
80
78
|
|
|
81
|
-
**num\_speakers
|
|
79
|
+
**num\_speakers** (`number`): Number of speakers to detect in the audio
|
|
82
80
|
|
|
83
|
-
**filetype
|
|
81
|
+
**filetype** (`string`): Audio file format (e.g., 'mp3', 'wav', 'ogg')
|
|
84
82
|
|
|
85
|
-
**timeoutInSeconds
|
|
83
|
+
**timeoutInSeconds** (`number`): Request timeout in seconds
|
|
86
84
|
|
|
87
|
-
**maxRetries
|
|
85
|
+
**maxRetries** (`number`): Maximum number of retry attempts
|
|
88
86
|
|
|
89
|
-
**abortSignal
|
|
87
|
+
**abortSignal** (`AbortSignal`): Signal to abort the request
|
|
90
88
|
|
|
91
89
|
Returns: `Promise<string>` - A Promise that resolves to the transcribed text
|
|
92
90
|
|
|
@@ -90,37 +90,35 @@ voice.close()
|
|
|
90
90
|
|
|
91
91
|
### Constructor Options
|
|
92
92
|
|
|
93
|
-
**apiKey
|
|
93
|
+
**apiKey** (`string`): Google API key for Gemini API authentication. Required unless using Vertex AI.
|
|
94
94
|
|
|
95
|
-
**model
|
|
95
|
+
**model** (`GeminiVoiceModel`): The model ID to use for real-time voice interactions. (Default: `'gemini-2.0-flash-exp'`)
|
|
96
96
|
|
|
97
|
-
**speaker
|
|
97
|
+
**speaker** (`GeminiVoiceName`): Default voice ID for speech synthesis. (Default: `'Puck'`)
|
|
98
98
|
|
|
99
|
-
**vertexAI
|
|
99
|
+
**vertexAI** (`boolean`): Use Vertex AI instead of Gemini API for authentication. (Default: `false`)
|
|
100
100
|
|
|
101
|
-
**project
|
|
101
|
+
**project** (`string`): Google Cloud project ID (required for Vertex AI).
|
|
102
102
|
|
|
103
|
-
**location
|
|
103
|
+
**location** (`string`): Google Cloud region for Vertex AI. (Default: `'us-central1'`)
|
|
104
104
|
|
|
105
|
-
**serviceAccountKeyFile
|
|
105
|
+
**serviceAccountKeyFile** (`string`): Path to service account JSON key file for Vertex AI authentication.
|
|
106
106
|
|
|
107
|
-
**serviceAccountEmail
|
|
107
|
+
**serviceAccountEmail** (`string`): Service account email for impersonation (alternative to key file).
|
|
108
108
|
|
|
109
|
-
**instructions
|
|
109
|
+
**instructions** (`string`): System instructions for the model.
|
|
110
110
|
|
|
111
|
-
**sessionConfig
|
|
111
|
+
**sessionConfig** (`GeminiSessionConfig`): Session configuration including interrupt and context settings.
|
|
112
112
|
|
|
113
|
-
**
|
|
113
|
+
**sessionConfig.interrupts** (`object`): Interrupt handling configuration.
|
|
114
114
|
|
|
115
|
-
|
|
115
|
+
**sessionConfig.interrupts.enabled** (`boolean`): Enable interrupt handling.
|
|
116
116
|
|
|
117
|
-
**interrupts
|
|
117
|
+
**sessionConfig.interrupts.allowUserInterruption** (`boolean`): Allow user to interrupt model responses.
|
|
118
118
|
|
|
119
|
-
**
|
|
119
|
+
**sessionConfig.contextCompression** (`boolean`): Enable automatic context compression.
|
|
120
120
|
|
|
121
|
-
**
|
|
122
|
-
|
|
123
|
-
**contextCompression?:** (`boolean`): Enable automatic context compression. (Default: `false`)
|
|
121
|
+
**debug** (`boolean`): Enable debug logging for troubleshooting. (Default: `false`)
|
|
124
122
|
|
|
125
123
|
## Methods
|
|
126
124
|
|
|
@@ -128,23 +126,23 @@ voice.close()
|
|
|
128
126
|
|
|
129
127
|
Establishes a connection to the Gemini Live API. Must be called before using speak, listen, or send methods.
|
|
130
128
|
|
|
131
|
-
**requestContext
|
|
129
|
+
**requestContext** (`object`): Optional request context for the connection.
|
|
132
130
|
|
|
133
|
-
**returns
|
|
131
|
+
**returns** (`Promise<void>`): Promise that resolves when the connection is established.
|
|
134
132
|
|
|
135
133
|
### speak()
|
|
136
134
|
|
|
137
135
|
Converts text to speech and sends it to the model. Can accept either a string or a readable stream as input.
|
|
138
136
|
|
|
139
|
-
**input
|
|
137
|
+
**input** (`string | NodeJS.ReadableStream`): Text or text stream to convert to speech.
|
|
140
138
|
|
|
141
|
-
**options
|
|
139
|
+
**options** (`GeminiLiveVoiceOptions`): Optional speech configuration.
|
|
142
140
|
|
|
143
|
-
**options.speaker
|
|
141
|
+
**options.speaker** (`GeminiVoiceName`): Voice ID to use for this specific speech request. (Default: `Constructor's speaker value`)
|
|
144
142
|
|
|
145
|
-
**options.languageCode
|
|
143
|
+
**options.languageCode** (`string`): Language code for the response.
|
|
146
144
|
|
|
147
|
-
**options.responseModalities
|
|
145
|
+
**options.responseModalities** (`('AUDIO' | 'TEXT')[]`): Response modalities to receive from the model. (Default: `['AUDIO', 'TEXT']`)
|
|
148
146
|
|
|
149
147
|
Returns: `Promise<void>` (responses are emitted via `speaker` and `writing` events)
|
|
150
148
|
|
|
@@ -152,9 +150,9 @@ Returns: `Promise<void>` (responses are emitted via `speaker` and `writing` even
|
|
|
152
150
|
|
|
153
151
|
Processes audio input for speech recognition. Takes a readable stream of audio data and returns the transcribed text.
|
|
154
152
|
|
|
155
|
-
**audioStream
|
|
153
|
+
**audioStream** (`NodeJS.ReadableStream`): Audio stream to transcribe.
|
|
156
154
|
|
|
157
|
-
**options
|
|
155
|
+
**options** (`GeminiLiveVoiceOptions`): Optional listening configuration.
|
|
158
156
|
|
|
159
157
|
Returns: `Promise<string>` - The transcribed text
|
|
160
158
|
|
|
@@ -162,7 +160,7 @@ Returns: `Promise<string>` - The transcribed text
|
|
|
162
160
|
|
|
163
161
|
Streams audio data in real-time to the Gemini service for continuous audio streaming scenarios like live microphone input.
|
|
164
162
|
|
|
165
|
-
**audioData
|
|
163
|
+
**audioData** (`NodeJS.ReadableStream | Int16Array`): Audio stream or buffer to send to the service.
|
|
166
164
|
|
|
167
165
|
Returns: `Promise<void>`
|
|
168
166
|
|
|
@@ -170,7 +168,7 @@ Returns: `Promise<void>`
|
|
|
170
168
|
|
|
171
169
|
Updates the session configuration dynamically. This can be used to modify voice settings, speaker selection, and other runtime configurations.
|
|
172
170
|
|
|
173
|
-
**config
|
|
171
|
+
**config** (`Partial<GeminiLiveVoiceConfig>`): Configuration updates to apply.
|
|
174
172
|
|
|
175
173
|
Returns: `Promise<void>`
|
|
176
174
|
|
|
@@ -178,7 +176,7 @@ Returns: `Promise<void>`
|
|
|
178
176
|
|
|
179
177
|
Adds a set of tools to the voice instance. Tools allow the model to perform additional actions during conversations. When GeminiLiveVoice is added to an Agent, any tools configured for the Agent will automatically be available to the voice interface.
|
|
180
178
|
|
|
181
|
-
**tools
|
|
179
|
+
**tools** (`ToolsInput`): Tools configuration to equip.
|
|
182
180
|
|
|
183
181
|
Returns: `void`
|
|
184
182
|
|
|
@@ -186,7 +184,7 @@ Returns: `void`
|
|
|
186
184
|
|
|
187
185
|
Adds or updates system instructions for the model.
|
|
188
186
|
|
|
189
|
-
**instructions
|
|
187
|
+
**instructions** (`string`): System instructions to set.
|
|
190
188
|
|
|
191
189
|
Returns: `void`
|
|
192
190
|
|
|
@@ -194,7 +192,7 @@ Returns: `void`
|
|
|
194
192
|
|
|
195
193
|
Triggers a response from the model. This method is primarily used internally when integrated with an Agent.
|
|
196
194
|
|
|
197
|
-
**options
|
|
195
|
+
**options** (`Record<string, unknown>`): Optional parameters for the answer request.
|
|
198
196
|
|
|
199
197
|
Returns: `Promise<void>`
|
|
200
198
|
|
|
@@ -220,9 +218,9 @@ Returns: `void`
|
|
|
220
218
|
|
|
221
219
|
Registers an event listener for voice events.
|
|
222
220
|
|
|
223
|
-
**event
|
|
221
|
+
**event** (`string`): Name of the event to listen for.
|
|
224
222
|
|
|
225
|
-
**callback
|
|
223
|
+
**callback** (`Function`): Function to call when the event occurs.
|
|
226
224
|
|
|
227
225
|
Returns: `void`
|
|
228
226
|
|
|
@@ -230,9 +228,9 @@ Returns: `void`
|
|
|
230
228
|
|
|
231
229
|
Removes a previously registered event listener.
|
|
232
230
|
|
|
233
|
-
**event
|
|
231
|
+
**event** (`string`): Name of the event to stop listening to.
|
|
234
232
|
|
|
235
|
-
**callback
|
|
233
|
+
**callback** (`Function`): The specific callback function to remove.
|
|
236
234
|
|
|
237
235
|
Returns: `void`
|
|
238
236
|
|
|
@@ -240,23 +238,23 @@ Returns: `void`
|
|
|
240
238
|
|
|
241
239
|
The GeminiLiveVoice class emits the following events:
|
|
242
240
|
|
|
243
|
-
**speaker
|
|
241
|
+
**speaker** (`event`): Emitted when audio data is received from the model. Callback receives a NodeJS.ReadableStream.
|
|
244
242
|
|
|
245
|
-
**speaking
|
|
243
|
+
**speaking** (`event`): Emitted with audio metadata. Callback receives { audioData?: Int16Array, sampleRate?: number }.
|
|
246
244
|
|
|
247
|
-
**writing
|
|
245
|
+
**writing** (`event`): Emitted when transcribed text is available. Callback receives { text: string, role: 'assistant' | 'user' }.
|
|
248
246
|
|
|
249
|
-
**session
|
|
247
|
+
**session** (`event`): Emitted on session state changes. Callback receives { state: 'connecting' | 'connected' | 'disconnected' | 'disconnecting' | 'updated', config?: object }.
|
|
250
248
|
|
|
251
|
-
**turnComplete
|
|
249
|
+
**turnComplete** (`event`): Emitted when a conversation turn is completed. Callback receives { timestamp: number }.
|
|
252
250
|
|
|
253
|
-
**toolCall
|
|
251
|
+
**toolCall** (`event`): Emitted when the model requests a tool call. Callback receives { name: string, args: object, id: string }.
|
|
254
252
|
|
|
255
|
-
**usage
|
|
253
|
+
**usage** (`event`): Emitted with token usage information. Callback receives { inputTokens: number, outputTokens: number, totalTokens: number, modality: string }.
|
|
256
254
|
|
|
257
|
-
**error
|
|
255
|
+
**error** (`event`): Emitted when an error occurs. Callback receives { message: string, code?: string, details?: unknown }.
|
|
258
256
|
|
|
259
|
-
**interrupt
|
|
257
|
+
**interrupt** (`event`): Interrupt events. Callback receives { type: 'user' | 'model', timestamp: number }.
|
|
260
258
|
|
|
261
259
|
## Available Models
|
|
262
260
|
|
|
@@ -32,25 +32,29 @@ const voices = await voice.getSpeakers({ languageCode: 'en-US' })
|
|
|
32
32
|
|
|
33
33
|
## Constructor Parameters
|
|
34
34
|
|
|
35
|
-
**speechModel
|
|
35
|
+
**speechModel** (`GoogleModelConfig`): Configuration for text-to-speech functionality (Default: `{ apiKey: process.env.GOOGLE_API_KEY }`)
|
|
36
36
|
|
|
37
|
-
**
|
|
37
|
+
**speechModel.apiKey** (`string`): Google Cloud API key. Falls back to GOOGLE\_API\_KEY environment variable. Not used when vertexAI is true.
|
|
38
38
|
|
|
39
|
-
**
|
|
39
|
+
**speechModel.keyFilename** (`string`): Path to service account JSON key file. Falls back to GOOGLE\_APPLICATION\_CREDENTIALS environment variable.
|
|
40
40
|
|
|
41
|
-
**
|
|
41
|
+
**speechModel.credentials** (`object`): In-memory service account credentials object with client\_email and private\_key properties.
|
|
42
42
|
|
|
43
|
-
**
|
|
43
|
+
**listeningModel** (`GoogleModelConfig`): Configuration for speech-to-text functionality (Default: `{ apiKey: process.env.GOOGLE_API_KEY }`)
|
|
44
44
|
|
|
45
|
-
**
|
|
45
|
+
**listeningModel.apiKey** (`string`): Google Cloud API key. Falls back to GOOGLE\_API\_KEY environment variable. Not used when vertexAI is true.
|
|
46
46
|
|
|
47
|
-
|
|
47
|
+
**listeningModel.keyFilename** (`string`): Path to service account JSON key file. Falls back to GOOGLE\_APPLICATION\_CREDENTIALS environment variable.
|
|
48
48
|
|
|
49
|
-
**
|
|
49
|
+
**listeningModel.credentials** (`object`): In-memory service account credentials object with client\_email and private\_key properties.
|
|
50
50
|
|
|
51
|
-
**
|
|
51
|
+
**speaker** (`string`): Default voice ID to use for text-to-speech (Default: `'en-US-Casual-K'`)
|
|
52
52
|
|
|
53
|
-
**
|
|
53
|
+
**vertexAI** (`boolean`): Enable Vertex AI mode for enterprise deployments. Uses project-based authentication instead of API keys. Requires 'project' to be set. (Default: `false`)
|
|
54
|
+
|
|
55
|
+
**project** (`string`): Google Cloud project ID (required when vertexAI is true). Falls back to GOOGLE\_CLOUD\_PROJECT environment variable.
|
|
56
|
+
|
|
57
|
+
**location** (`string`): Google Cloud region for Vertex AI. Falls back to GOOGLE\_CLOUD\_LOCATION environment variable. (Default: `'us-central1'`)
|
|
54
58
|
|
|
55
59
|
## Methods
|
|
56
60
|
|
|
@@ -58,15 +62,15 @@ const voices = await voice.getSpeakers({ languageCode: 'en-US' })
|
|
|
58
62
|
|
|
59
63
|
Converts text to speech using Google Cloud Text-to-Speech service.
|
|
60
64
|
|
|
61
|
-
**input
|
|
65
|
+
**input** (`string | NodeJS.ReadableStream`): Text to convert to speech. If a stream is provided, it will be converted to text first.
|
|
62
66
|
|
|
63
|
-
**options
|
|
67
|
+
**options** (`object`): Speech synthesis options
|
|
64
68
|
|
|
65
|
-
**options.speaker
|
|
69
|
+
**options.speaker** (`string`): Voice ID to use for this request
|
|
66
70
|
|
|
67
|
-
**options.languageCode
|
|
71
|
+
**options.languageCode** (`string`): Language code for the voice (e.g., 'en-US'). Defaults to the language code from the speaker ID or 'en-US'
|
|
68
72
|
|
|
69
|
-
**options.audioConfig
|
|
73
|
+
**options.audioConfig** (`ISynthesizeSpeechRequest['audioConfig']`): Audio configuration options from Google Cloud Text-to-Speech API (Default: `{ audioEncoding: 'LINEAR16' }`)
|
|
70
74
|
|
|
71
75
|
Returns: `Promise<NodeJS.ReadableStream>`
|
|
72
76
|
|
|
@@ -74,13 +78,13 @@ Returns: `Promise<NodeJS.ReadableStream>`
|
|
|
74
78
|
|
|
75
79
|
Converts speech to text using Google Cloud Speech-to-Text service.
|
|
76
80
|
|
|
77
|
-
**audioStream
|
|
81
|
+
**audioStream** (`NodeJS.ReadableStream`): Audio stream to transcribe
|
|
78
82
|
|
|
79
|
-
**options
|
|
83
|
+
**options** (`object`): Recognition options
|
|
80
84
|
|
|
81
|
-
**options.stream
|
|
85
|
+
**options.stream** (`boolean`): Whether to use streaming recognition
|
|
82
86
|
|
|
83
|
-
**options.config
|
|
87
|
+
**options.config** (`IRecognitionConfig`): Recognition configuration from Google Cloud Speech-to-Text API (Default: `{ encoding: 'LINEAR16', languageCode: 'en-US' }`)
|
|
84
88
|
|
|
85
89
|
Returns: `Promise<string>`
|
|
86
90
|
|
|
@@ -88,9 +92,9 @@ Returns: `Promise<string>`
|
|
|
88
92
|
|
|
89
93
|
Returns an array of available voice options, where each entry contains:
|
|
90
94
|
|
|
91
|
-
**voiceId
|
|
95
|
+
**voiceId** (`string`): Unique identifier for the voice
|
|
92
96
|
|
|
93
|
-
**languageCodes
|
|
97
|
+
**languageCodes** (`string[]`): List of language codes supported by this voice
|
|
94
98
|
|
|
95
99
|
### isUsingVertexAI()
|
|
96
100
|
|
|
@@ -79,31 +79,31 @@ class MyVoiceProvider extends MastraVoice {
|
|
|
79
79
|
|
|
80
80
|
## Constructor Parameters
|
|
81
81
|
|
|
82
|
-
**config
|
|
82
|
+
**config** (`VoiceConfig`): Configuration object for the voice service
|
|
83
83
|
|
|
84
|
-
**config.speechModel
|
|
84
|
+
**config.speechModel** (`BuiltInModelConfig`): Configuration for the text-to-speech model
|
|
85
85
|
|
|
86
|
-
**config.
|
|
86
|
+
**config.speechModel.name** (`string`): Name of the model to use
|
|
87
87
|
|
|
88
|
-
**config.
|
|
88
|
+
**config.speechModel.apiKey** (`string`): API key for the model service
|
|
89
89
|
|
|
90
|
-
**config.
|
|
90
|
+
**config.listeningModel** (`BuiltInModelConfig`): Configuration for the speech-to-text model
|
|
91
91
|
|
|
92
|
-
**config.
|
|
92
|
+
**config.listeningModel.name** (`string`): Name of the model to use
|
|
93
93
|
|
|
94
|
-
|
|
94
|
+
**config.listeningModel.apiKey** (`string`): API key for the model service
|
|
95
95
|
|
|
96
|
-
**
|
|
96
|
+
**config.speaker** (`string`): Default speaker/voice ID to use
|
|
97
97
|
|
|
98
|
-
**
|
|
98
|
+
**config.name** (`string`): Name for the voice provider instance
|
|
99
99
|
|
|
100
|
-
|
|
100
|
+
**config.realtimeConfig** (`object`): Configuration for real-time speech-to-speech capabilities
|
|
101
101
|
|
|
102
|
-
**model
|
|
102
|
+
**config.realtimeConfig.model** (`string`): Model to use for real-time speech-to-speech capabilities
|
|
103
103
|
|
|
104
|
-
**apiKey
|
|
104
|
+
**config.realtimeConfig.apiKey** (`string`): API key for the real-time service
|
|
105
105
|
|
|
106
|
-
**options
|
|
106
|
+
**config.realtimeConfig.options** (`unknown`): Provider-specific options for real-time capabilities
|
|
107
107
|
|
|
108
108
|
## Abstract Methods
|
|
109
109
|
|
|
@@ -281,21 +281,21 @@ Purpose:
|
|
|
281
281
|
|
|
282
282
|
The MastraVoice class includes an event system for real-time communication. Standard event types include:
|
|
283
283
|
|
|
284
|
-
**speaking
|
|
284
|
+
**speaking** (`{ text: string; audioStream?: NodeJS.ReadableStream; audio?: Int16Array }`): Emitted when the voice provider is speaking; contains audio data
|
|
285
285
|
|
|
286
|
-
**writing
|
|
286
|
+
**writing** (`{ text: string; role: string }`): Emitted when text is transcribed from speech
|
|
287
287
|
|
|
288
|
-
**error
|
|
288
|
+
**error** (`{ message: string; code?: string; details?: unknown }`): Emitted when an error occurs
|
|
289
289
|
|
|
290
290
|
## Protected Properties
|
|
291
291
|
|
|
292
|
-
**listeningModel
|
|
292
|
+
**listeningModel** (`BuiltInModelConfig | undefined`): Configuration for the speech-to-text model
|
|
293
293
|
|
|
294
|
-
**speechModel
|
|
294
|
+
**speechModel** (`BuiltInModelConfig | undefined`): Configuration for the text-to-speech model
|
|
295
295
|
|
|
296
|
-
**speaker
|
|
296
|
+
**speaker** (`string | undefined`): Default speaker/voice ID
|
|
297
297
|
|
|
298
|
-
**realtimeConfig
|
|
298
|
+
**realtimeConfig** (`{ model?: string; apiKey?: string; options?: unknown } | undefined`): Configuration for real-time speech-to-speech capabilities
|
|
299
299
|
|
|
300
300
|
## Telemetry Support
|
|
301
301
|
|
|
@@ -45,41 +45,37 @@ const voices = await voice.getSpeakers()
|
|
|
45
45
|
|
|
46
46
|
## Constructor Parameters
|
|
47
47
|
|
|
48
|
-
**speechModel
|
|
48
|
+
**speechModel** (`MurfConfig`): Configuration for text-to-speech functionality (Default: `{ name: 'GEN2' }`)
|
|
49
49
|
|
|
50
|
-
**
|
|
50
|
+
**speechModel.name** (`'GEN1' | 'GEN2'`): The Murf model generation to use
|
|
51
51
|
|
|
52
|
-
|
|
52
|
+
**speechModel.apiKey** (`string`): Murf API key. Falls back to the MURF\_API\_KEY environment variable.
|
|
53
53
|
|
|
54
|
-
**
|
|
54
|
+
**speechModel.properties** (`object`): Default properties for all speech synthesis requests
|
|
55
55
|
|
|
56
|
-
**
|
|
56
|
+
**speechModel.properties.style** (`string`): Speaking style for the voice
|
|
57
57
|
|
|
58
|
-
**properties
|
|
58
|
+
**speechModel.properties.rate** (`number`): Speech rate multiplier
|
|
59
59
|
|
|
60
|
-
|
|
60
|
+
**speechModel.properties.pitch** (`number`): Voice pitch adjustment
|
|
61
61
|
|
|
62
|
-
**
|
|
62
|
+
**speechModel.properties.sampleRate** (`8000 | 24000 | 44100 | 48000`): Audio sample rate in Hz
|
|
63
63
|
|
|
64
|
-
**
|
|
64
|
+
**speechModel.properties.format** (`'MP3' | 'WAV' | 'FLAC' | 'ALAW' | 'ULAW'`): Output audio format
|
|
65
65
|
|
|
66
|
-
**
|
|
66
|
+
**speechModel.properties.channelType** (`'STEREO' | 'MONO'`): Audio channel configuration
|
|
67
67
|
|
|
68
|
-
**
|
|
68
|
+
**speechModel.properties.pronunciationDictionary** (`Record<string, string>`): Custom pronunciation mappings
|
|
69
69
|
|
|
70
|
-
**
|
|
70
|
+
**speechModel.properties.encodeAsBase64** (`boolean`): Whether to encode the audio as base64
|
|
71
71
|
|
|
72
|
-
**
|
|
72
|
+
**speechModel.properties.variation** (`number`): Voice variation parameter
|
|
73
73
|
|
|
74
|
-
**
|
|
74
|
+
**speechModel.properties.audioDuration** (`number`): Target audio duration in seconds
|
|
75
75
|
|
|
76
|
-
**
|
|
76
|
+
**speechModel.properties.multiNativeLocale** (`string`): Locale for multilingual support
|
|
77
77
|
|
|
78
|
-
**
|
|
79
|
-
|
|
80
|
-
**audioDuration?:** (`number`): Target audio duration in seconds
|
|
81
|
-
|
|
82
|
-
**multiNativeLocale?:** (`string`): Locale for multilingual support
|
|
78
|
+
**speaker** (`string`): Default voice ID to use for text-to-speech (Default: `'en-UK-hazel'`)
|
|
83
79
|
|
|
84
80
|
## Methods
|
|
85
81
|
|
|
@@ -87,13 +83,13 @@ const voices = await voice.getSpeakers()
|
|
|
87
83
|
|
|
88
84
|
Converts text to speech using Murf's API.
|
|
89
85
|
|
|
90
|
-
**input
|
|
86
|
+
**input** (`string | NodeJS.ReadableStream`): Text to convert to speech. If a stream is provided, it will be converted to text first.
|
|
91
87
|
|
|
92
|
-
**options
|
|
88
|
+
**options** (`object`): Speech synthesis options
|
|
93
89
|
|
|
94
|
-
**options.speaker
|
|
90
|
+
**options.speaker** (`string`): Override the default speaker for this request
|
|
95
91
|
|
|
96
|
-
**options.properties
|
|
92
|
+
**options.properties** (`object`): Override default speech properties for this request
|
|
97
93
|
|
|
98
94
|
Returns: `Promise<NodeJS.ReadableStream>`
|
|
99
95
|
|
|
@@ -101,13 +97,13 @@ Returns: `Promise<NodeJS.ReadableStream>`
|
|
|
101
97
|
|
|
102
98
|
Returns an array of available voice options, where each entry contains:
|
|
103
99
|
|
|
104
|
-
**voiceId
|
|
100
|
+
**voiceId** (`string`): Unique identifier for the voice
|
|
105
101
|
|
|
106
|
-
**name
|
|
102
|
+
**name** (`string`): Display name of the voice
|
|
107
103
|
|
|
108
|
-
**language
|
|
104
|
+
**language** (`string`): Language code for the voice
|
|
109
105
|
|
|
110
|
-
**gender
|
|
106
|
+
**gender** (`string`): Gender of the voice
|
|
111
107
|
|
|
112
108
|
### listen()
|
|
113
109
|
|