npm - getpatter - Versions diffs - 0.6.1 → 0.6.2 - Mend

getpatter 0.6.1 → 0.6.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14)

package/dist/chunk-CL2U3YET.mjs +1429 -0
package/dist/{chunk-TEW3NAZJ.mjs → chunk-LE63CSOB.mjs} +371 -1486
package/dist/{chunk-RV7APPYE.mjs → chunk-R2T4JABZ.mjs} +13 -0
package/dist/cli.js +48 -23
package/dist/dashboard/ui.html +8 -8
package/dist/index.d.mts +452 -186
package/dist/index.d.ts +452 -186
package/dist/index.js +1485 -979
package/dist/index.mjs +973 -790
package/dist/openai-realtime-2-CNFARP25.mjs +8 -0
package/dist/{silero-vad-NSEXI4XS.mjs → silero-vad-LNDFGIY7.mjs} +1 -1
package/dist/{test-mode-WEKKNBLD.mjs → test-mode-RS57BDM6.mjs} +2 -1
package/package.json +1 -1
package/src/dashboard/ui.html +8 -8

package/dist/index.d.mts CHANGED

@@ -61,7 +61,11 @@ declare class Carrier {
 interface RealtimeOptions {
     /** API key. Falls back to OPENAI_API_KEY env var when omitted. */
     apiKey?: string;
-    /** Realtime model. Defaults to gpt-4o-mini-realtime-preview. */
+    /**
+     * Realtime model. Defaults to ``gpt-realtime-mini`` (bumped from the
+     * deprecated ``gpt-4o-mini-realtime-preview`` on 2026-05-25 for
+     * parity with the Python SDK and the GA Realtime API surface).
+     */
     model?: string;
     /** Voice preset. Defaults to alloy. */
     voice?: string;
@@ -1258,15 +1262,16 @@ interface AgentOptions {
      */
     prewarm?: boolean;
     /**
-     * When ``true`` (default ``false``), ``Patter.call`` also pre-renders
-     * ``firstMessage`` to TTS audio bytes during the ringing window and
-     * streams the cached buffer immediately when the carrier emits
-     * ``start``. Eliminates the 200-700 ms TTS first-byte latency on the
-     * greeting at the cost of paying the TTS bill even if the call is
-     * never answered (silently logged at warn level when the call
-     * fails). Off by default to preserve the prior cost surface; opt-in
-     * for production outbound where every millisecond of greeting
-     * latency hurts conversion. Default: ``false``.
+     * When ``true`` (default since 0.6.2 in pipeline mode), ``Patter.call``
+     * pre-renders ``firstMessage`` to TTS audio bytes during the ringing
+     * window and streams the cached buffer immediately when the carrier
+     * emits ``start``. Eliminates the 200-700 ms TTS first-byte latency
+     * on the greeting that dominated first-turn ``p95`` on every pipeline
+     * acceptance run. The trade-off is paying the TTS bill even if the
+     * call is never answered (silently logged at warn level when the call
+     * fails) — typically $0.001-$0.005 per ringing call depending on TTS
+     * provider. Opt out by passing ``prewarmFirstMessage: false`` (e.g.
+     * for very high-volume outbound where un-answered TTS spend matters).
      *
      * **Pipeline mode only.** Realtime / ConvAI provider modes never
      * consume the prewarm cache (the StreamHandler for those modes runs
@@ -1563,12 +1568,35 @@ declare class ElevenLabsTTS {
     private readonly apiKey;
     private readonly voiceId;
     private readonly modelId;
-    private readonly outputFormat;
+    private _outputFormat;
+    private readonly _outputFormatExplicit;
     private readonly voiceSettings;
     private readonly languageCode;
     private readonly chunkSize;
+    /**
+     * Public view of the (possibly auto-flipped) wire format. Read by the
+     * stream-handler to decide whether to skip the client-side resample +
+     * mulaw encode when the bytes are already in the carrier's wire codec.
+     */
+    get outputFormat(): ElevenLabsOutputFormat;
     constructor(apiKey: string, voiceId?: string, modelId?: string, outputFormat?: ElevenLabsOutputFormat | string);
     constructor(apiKey: string, options: ElevenLabsTTSOptions$1);
+    /**
+     * Hook called by ``StreamHandler.initPipeline`` to advise the carrier
+     * wire format. When the user did NOT pass an explicit ``outputFormat``,
+     * auto-flip to the carrier's native codec so the audio bytes ElevenLabs
+     * returns are already in Twilio/Telnyx wire format — eliminating the
+     * client-side 16 kHz → 8 kHz resample and PCM → μ-law encode. The
+     * resample/encode chain was a source of audible artifacts on the
+     * prewarmed firstMessage (see 0.6.2 acceptance notes — burst delivery
+     * of resampled audio crackled on the carrier-side jitter buffer).
+     *
+     * No-op when the caller passed an explicit ``outputFormat`` (incl. via
+     * the ``forTwilio`` / ``forTelnyx`` factories) — user wins.
+     *
+     * Parity with {@link ElevenLabsWebSocketTTS.setTelephonyCarrier}.
+     */
+    setTelephonyCarrier(carrier: string): void;
     /**
      * Construct an instance pre-configured for Twilio Media Streams.
      *
@@ -1695,6 +1723,20 @@ declare class ElevenLabsWebSocketTTS implements TTSAdapter {
      * changes.
      */
     private adoptedConnection;
+    /**
+     * Active WS for the in-flight ``synthesizeStream`` call, if any. Set
+     * when a stream starts, cleared in its ``finally`` block. The
+     * stream-handler calls ``cancelActiveStream()`` from ``cancelSpeaking``
+     * to unblock the generator's inner ``await Promise<frame>`` — without
+     * it, a barge-in on the firstMessage live path leaves the for-await
+     * stuck waiting for the next frame; ElevenLabs never sends
+     * ``isFinal=true`` after the consumer breaks, the 30 s frame timeout
+     * fires post-call, and meanwhile ``initPipeline`` never returns so
+     * the STT ``onTranscript`` callback never registers and subsequent
+     * user turns are silently dropped (root cause of the 2026-05-20
+     * "first message OK, then no response" symptom).
+     */
+    private activeStreamWs;
     /**
      * The wire format requested over the ElevenLabs WS. Initially set from
      * the constructor; ``setTelephonyCarrier`` may auto-flip it to the
@@ -1719,6 +1761,22 @@ declare class ElevenLabsWebSocketTTS implements TTSAdapter {
      * the user's choice always wins.
      */
     setTelephonyCarrier(carrier: string): void;
+    /**
+     * Force-close the WebSocket of any in-flight ``synthesizeStream`` call.
+     * Called by the stream-handler from ``cancelSpeaking`` (barge-in) so
+     * the generator's inner ``await Promise<frame>`` loop unblocks cleanly
+     * via the ``onClose`` handler — instead of waiting up to 30 s for the
+     * ``FRAME_TIMEOUT_MS`` watchdog to fire. No-op when no stream is in
+     * flight or when the WS is already closing.
+     *
+     * Without this, a barge-in during the firstMessage live path left the
+     * for-await stuck (ElevenLabs never sends ``isFinal=true`` after the
+     * consumer breaks), ``initPipeline`` never returned, the STT
+     * ``onTranscript`` callback never registered, and the entire remainder
+     * of the call was silent for the user. Surfaced during the 2026-05-20
+     * acceptance run.
+     */
+    cancelActiveStream(): void;
     /** Pre-configured for Twilio Media Streams (`ulaw_8000`). */
     static forTwilio(opts: Omit<ElevenLabsWebSocketTTSOptions, 'outputFormat'>): ElevenLabsWebSocketTTS;
     /** Pre-configured for Telnyx (`pcm_16000`). */
@@ -2777,6 +2835,27 @@ declare function geminiLive(opts: {
     voice?: string;
 }): RealtimeConfig;
+/**
+ * Default provider pricing and merge utilities.
+ *
+ * Pricing reflects public provider rates as of 2026. Each provider entry
+ * carries provider-level defaults (the model Patter ships with by default)
+ * plus an optional ``models`` map keyed by model identifier with per-model
+ * overrides. Cost-calc functions take an optional ``model`` arg and
+ * auto-resolve the rate via {@link resolveProviderRates} (longest-prefix
+ * match for versioned model IDs). When the agent's adapter exposes
+ * ``model`` and the metrics layer threads it through, the dashboard bills
+ * with model accuracy out of the box — no manual override needed.
+ *
+ * User overrides via ``new Patter({ pricing: {...} })`` keep working as
+ * before. To register a new model rate without touching the SDK source:
+ *
+ *     new Patter({ pricing: { elevenlabs: { models: { my_custom: { price: 0.075 } } } } })
+ */
+/** Pricing table version identifier, updated in lockstep with the Python SDK. */
+declare const PRICING_VERSION = "2026.3";
+/** ISO date the pricing table was last refreshed against public provider rates. */
+declare const PRICING_LAST_UPDATED = "2026-05-08";
 /**
  * Billing units used by ``DEFAULT_PRICING`` entries. String values keep the
  * pricing table JSON-serialisable and backwards-compatible with consumers
@@ -3067,6 +3146,21 @@ declare class CallMetricsAccumulator {
     private _bargeinStoppedAt;
     private _turnUserText;
     private _turnSttAudioSeconds;
+    /**
+     * Guard against the recordTurnInterrupted / recordTurnComplete race.
+     *
+     * A VAD-path barge-in fires ``recordTurnInterrupted`` synchronously
+     * inside ``handleAudioAsync`` while the in-flight pipeline LLM stream
+     * keeps unwinding on its own task. When the LLM stream eventually
+     * exits, the existing pipeline path falls through to
+     * ``recordTurnComplete``, which would push a second turn for the same
+     * logical exchange (this time carrying ``user_text=''`` because the
+     * field was already reset). ``_turnAlreadyClosed`` is flipped by
+     * ``recordTurnInterrupted`` and read by ``recordTurnComplete`` so the
+     * late ``recordTurnComplete`` becomes a no-op until the next
+     * ``startTurn`` re-arms the accumulator.
+     */
+    private _turnAlreadyClosed;
     private _totalSttAudioSeconds;
     private _totalTtsCharacters;
     private _totalRealtimeCost;
@@ -3202,9 +3296,26 @@ declare class CallMetricsAccumulator {
      * to compute ``bargein_ms``.
      */
     recordTtsStopped(ts?: number): void;
-    /** Close the current turn cleanly and append a `TurnMetrics` record. */
-    recordTurnComplete(agentText: string): TurnMetrics;
-    /** Close the current turn as interrupted (barge-in) and return the recorded metrics. */
+    /**
+     * Close the current turn cleanly and append a `TurnMetrics` record.
+     *
+     * Returns ``null`` when ``recordTurnInterrupted`` has already closed
+     * the current turn — this protects against the VAD-barge-in /
+     * pipeline-LLM race where both paths try to finalise the same logical
+     * turn and the second would otherwise push a phantom entry with
+     * ``user_text=''``. The caller treats ``null`` as "nothing to emit";
+     * ``emitTurnMetrics`` is already null-safe.
+     */
+    recordTurnComplete(agentText: string): TurnMetrics | null;
+    /**
+     * Close the current turn as interrupted (barge-in) and return the
+     * recorded metrics. Returns ``null`` when no turn is open, OR when
+     * ``recordTurnComplete`` has already finalised the current turn —
+     * bidirectional parity with the guard at the top of
+     * ``recordTurnComplete``. Prevents an out-of-order interruption (e.g.
+     * a future refactor that reorders the bargein + LLM-unwind paths)
+     * from overwriting a turn that the complete path already emitted.
+     */
     recordTurnInterrupted(): TurnMetrics | null;
     /**
      * Record the moment VAD emitted speech_end for the current utterance.
@@ -3346,6 +3457,67 @@ declare const OpenAIRealtimeAudioFormat: {
 };
 /** Union of {@link OpenAIRealtimeAudioFormat} string values. */
 type OpenAIRealtimeAudioFormat = (typeof OpenAIRealtimeAudioFormat)[keyof typeof OpenAIRealtimeAudioFormat];
+/**
+ * Known OpenAI Realtime API model identifiers.
+ *
+ * `GPT_REALTIME_2` is OpenAI's most-capable realtime voice model
+ * (speech-to-speech with configurable reasoning effort, stronger
+ * instruction following, 128K context). It accepts the same session
+ * update wire format as the v1 `gpt-realtime` family but supports an
+ * additional `reasoning.effort` field — see `reasoningEffort` on
+ * {@link OpenAIRealtimeOptions}. Pricing differs from the mini default;
+ * override `DEFAULT_PRICING.openai_realtime` with the values in
+ * `DEFAULT_PRICING.openai_realtime_2` when selecting it.
+ */
+declare const OpenAIRealtimeModel: {
+    readonly GPT_REALTIME: "gpt-realtime";
+    readonly GPT_REALTIME_2: "gpt-realtime-2";
+    readonly GPT_REALTIME_MINI: "gpt-realtime-mini";
+    readonly GPT_4O_REALTIME_PREVIEW: "gpt-4o-realtime-preview";
+    readonly GPT_4O_MINI_REALTIME_PREVIEW: "gpt-4o-mini-realtime-preview";
+};
+/** Union of {@link OpenAIRealtimeModel} string values. */
+type OpenAIRealtimeModel = (typeof OpenAIRealtimeModel)[keyof typeof OpenAIRealtimeModel];
+/** OpenAI Realtime / TTS voice identifiers. */
+declare const OpenAIVoice: {
+    readonly ALLOY: "alloy";
+    readonly ASH: "ash";
+    readonly BALLAD: "ballad";
+    readonly CORAL: "coral";
+    readonly ECHO: "echo";
+    readonly FABLE: "fable";
+    readonly NOVA: "nova";
+    readonly ONYX: "onyx";
+    readonly SAGE: "sage";
+    readonly SHIMMER: "shimmer";
+    readonly VERSE: "verse";
+};
+/** Union of {@link OpenAIVoice} string values. */
+type OpenAIVoice = (typeof OpenAIVoice)[keyof typeof OpenAIVoice];
+/**
+ * Models accepted by `input_audio_transcription` on Realtime sessions.
+ *
+ * `GPT_REALTIME_WHISPER` is OpenAI's streaming-optimised Whisper variant
+ * designed for low-latency transcript deltas inside a Realtime session.
+ * Billed per minute of audio (separate from the conversational model
+ * tokens). Use it when you want faster partial transcripts than
+ * `whisper-1` at lower cost than `gpt-4o-transcribe`.
+ */
+declare const OpenAITranscriptionModel: {
+    readonly WHISPER_1: "whisper-1";
+    readonly GPT_4O_TRANSCRIBE: "gpt-4o-transcribe";
+    readonly GPT_4O_MINI_TRANSCRIBE: "gpt-4o-mini-transcribe";
+    readonly GPT_REALTIME_WHISPER: "gpt-realtime-whisper";
+};
+/** Union of {@link OpenAITranscriptionModel} string values. */
+type OpenAITranscriptionModel = (typeof OpenAITranscriptionModel)[keyof typeof OpenAITranscriptionModel];
+/** Server-side voice-activity-detection modes. */
+declare const OpenAIRealtimeVADType: {
+    readonly SERVER_VAD: "server_vad";
+    readonly SEMANTIC_VAD: "semantic_vad";
+};
+/** Union of {@link OpenAIRealtimeVADType} string values. */
+type OpenAIRealtimeVADType = (typeof OpenAIRealtimeVADType)[keyof typeof OpenAIRealtimeVADType];
 /** Callback signature for events emitted by {@link OpenAIRealtimeAdapter}. */
 type RealtimeEventCallback = (type: string, data: unknown) => void | Promise<void>;
 /** Constructor options for {@link OpenAIRealtimeAdapter}. */
@@ -3493,6 +3665,17 @@ declare class OpenAIRealtimeAdapter {
     cancelResponse(): void;
     /** Inject a user text turn and request a new response. */
     sendText(text: string): Promise<void>;
+    /**
+     * Trigger `response.create` with no new user item.
+     *
+     * Used by the Realtime stream-handler to drive a response after the
+     * client-side hallucination filter accepts an
+     * `input_audio_transcription.completed` event. The server VAD config
+     * sets `create_response: false` so OpenAI no longer auto-creates a
+     * response on every `input_audio_buffer.committed`; Patter is now
+     * responsible for triggering it explicitly when a real user turn lands.
+     */
+    requestResponse(): Promise<void>;
     /**
      * Make the AI speak ``text`` as its opening line.
      *
@@ -4708,6 +4891,18 @@ interface Transcript$3 {
 }
 type TranscriptCallback$3 = (transcript: Transcript$3) => void;
 type ErrorCallback$1 = (error: Error) => void;
+/** Known Deepgram STT models. */
+declare const DeepgramModel: {
+    readonly NOVA_3: "nova-3";
+    readonly NOVA_2: "nova-2";
+    readonly NOVA_2_PHONECALL: "nova-2-phonecall";
+    readonly NOVA_2_GENERAL: "nova-2-general";
+    readonly NOVA_2_MEETING: "nova-2-meeting";
+    readonly NOVA: "nova";
+    readonly ENHANCED: "enhanced";
+    readonly BASE: "base";
+};
+type DeepgramModel = (typeof DeepgramModel)[keyof typeof DeepgramModel];
 /**
  * Optional tuning knobs for Deepgram live transcription.
  *
@@ -4834,6 +5029,202 @@ declare class DeepgramSTT {
     close(): void;
 }
+/**
+ * Cartesia TTS provider — HTTP `/tts/bytes` endpoint.
+ *
+ * Cartesia also offers a WebSocket streaming mode with word timestamps;
+ * this provider focuses on the chunked-bytes HTTP API which maps cleanly
+ * onto Patter's `synthesize(text)` contract and keeps the provider
+ * dependency-free (just `fetch`).
+ *
+ * Default model is `sonic-3` (GA snapshot `sonic-3-2026-01-12`) — Cartesia's
+ * current GA model with a documented ~90 ms TTFB target. Voice IDs from the
+ * sonic-2 generation (including the default Katie voice) remain compatible.
+ *
+ * **Telephony optimization** — the constructor default
+ * `sampleRate=16000` is correct for web playback, dashboard previews, and
+ * 16 kHz pipelines. For real phone calls, use the carrier-specific
+ * factories instead:
+ *
+ * - {@link CartesiaTTS.forTwilio} requests `sampleRate=8000` natively from
+ *   Cartesia. Twilio's media-stream WebSocket expects μ-law @ 8 kHz, so
+ *   the SDK normally resamples 16 kHz → 8 kHz before doing the PCM →
+ *   μ-law transcode in `TwilioAudioSender`. Asking Cartesia for 8 kHz
+ *   PCM at the source skips the resample step (saves ~10–30 ms first-
+ *   byte plus per-frame CPU and removes a potential aliasing source).
+ *   The PCM → μ-law transcode still happens client-side.
+ * - {@link CartesiaTTS.forTelnyx} requests `sampleRate=16000`. Telnyx
+ *   negotiates L16/16000 on its bidirectional media WebSocket, so
+ *   16 kHz PCM is already the format used end-to-end and no
+ *   transcoding happens. This is the same as the bare-constructor
+ *   default and exists for API symmetry with the Twilio factory.
+ */
+/** Known Cartesia TTS models. */
+declare const CartesiaTTSModel: {
+    readonly SONIC_3: "sonic-3";
+    readonly SONIC_2: "sonic-2";
+    readonly SONIC: "sonic";
+};
+type CartesiaTTSModel = (typeof CartesiaTTSModel)[keyof typeof CartesiaTTSModel];
+/** Common PCM sample rates accepted by the Cartesia bytes endpoint. */
+declare const CartesiaTTSSampleRate: {
+    readonly HZ_8000: 8000;
+    readonly HZ_16000: 16000;
+    readonly HZ_22050: 22050;
+    readonly HZ_24000: 24000;
+    readonly HZ_44100: 44100;
+};
+type CartesiaTTSSampleRate = (typeof CartesiaTTSSampleRate)[keyof typeof CartesiaTTSSampleRate];
+/** Voice-selection mode passed in the Cartesia bytes payload. */
+declare const CartesiaTTSVoiceMode: {
+    readonly ID: "id";
+    readonly EMBEDDING: "embedding";
+};
+type CartesiaTTSVoiceMode = (typeof CartesiaTTSVoiceMode)[keyof typeof CartesiaTTSVoiceMode];
+/** Constructor options for {@link CartesiaTTS}. */
+interface CartesiaTTSOptions$1 {
+    model?: CartesiaTTSModel | string;
+    voice?: string;
+    language?: string;
+    sampleRate?: CartesiaTTSSampleRate | number;
+    speed?: string | number;
+    emotion?: string | string[];
+    volume?: number;
+    baseUrl?: string;
+    apiVersion?: string;
+}
+/** Cartesia TTS provider backed by the HTTP `/tts/bytes` streaming endpoint. */
+declare class CartesiaTTS {
+    /** Stable pricing/dashboard key — read by stream-handler/metrics. */
+    static readonly providerKey = "cartesia_tts";
+    private readonly apiKey;
+    private readonly model;
+    private readonly voice;
+    private readonly language;
+    private readonly sampleRate;
+    private readonly speed?;
+    private readonly emotion?;
+    private readonly volume?;
+    private readonly baseUrl;
+    private readonly apiVersion;
+    constructor(apiKey: string, opts?: CartesiaTTSOptions$1);
+    /**
+     * Construct an instance pre-configured for Twilio Media Streams.
+     *
+     * Sets `sampleRate=8000` so Cartesia emits PCM_S16LE @ 8 kHz directly.
+     * Twilio's media stream uses μ-law @ 8 kHz so the SDK still does the
+     * PCM → μ-law transcode client-side, but the 16 kHz → 8 kHz resample
+     * step is skipped. Saves ~10–30 ms first-byte plus per-frame CPU and
+     * removes a potential aliasing source.
+     */
+    static forTwilio(apiKey: string, options?: Omit<CartesiaTTSOptions$1, 'sampleRate'>): CartesiaTTS;
+    /**
+     * Construct an instance pre-configured for Telnyx bidirectional media.
+     *
+     * Sets `sampleRate=16000` to match Telnyx's L16/16000 default codec —
+     * audio flows end-to-end with zero resampling or transcoding. Same as
+     * the bare-constructor default; exists for API symmetry with
+     * {@link CartesiaTTS.forTwilio}.
+     */
+    static forTelnyx(apiKey: string, options?: Omit<CartesiaTTSOptions$1, 'sampleRate'>): CartesiaTTS;
+    /** Build the JSON payload for the Cartesia bytes endpoint. */
+    private buildPayload;
+    /**
+     * Pre-call HTTP warmup for the Cartesia `/tts/bytes` endpoint.
+     *
+     * Issues a lightweight `GET <baseUrl>/voices` so DNS, TLS, and HTTP/2
+     * are already up by the time the first `synthesizeStream()` POST
+     * lands. Best-effort: 5 s timeout, all exceptions swallowed at
+     * debug level.
+     *
+     * Billing safety: `GET /voices` is a free metadata read on
+     * Cartesia's REST surface (per https://docs.cartesia.ai). It does
+     * not consume synthesis credits. The actual synthesis is billed
+     * only when `POST /tts/bytes` runs with a non-empty `transcript`.
+     *
+     * Note: Cartesia TTS uses the HTTP path (vs the WebSocket variant
+     * Cartesia also exposes) — connection warmup is therefore HTTP-GET
+     * based, not WebSocket pre-handshake. The latency win is smaller
+     * (~50-150 ms vs the ~200-500 ms of a WS prewarm) but still real.
+     */
+    warmup(): Promise<void>;
+    /** Synthesize text and return the concatenated audio buffer. */
+    synthesize(text: string): Promise<Buffer>;
+    /**
+     * Synthesize text and yield raw PCM_S16LE chunks at the configured
+     * `sampleRate` as they arrive from Cartesia.
+     */
+    synthesizeStream(text: string): AsyncGenerator<Buffer>;
+}
+/**
+ * Rime TTS provider — HTTP chunked endpoint.
+ *
+ * Supports both Arcana and Mist model families. The Arcana model can take
+ * up to ~80% of the output audio's duration to synthesize, so its request
+ * timeout is bumped to 4 minutes.
+ */
+/** Rime TTS model families. */
+declare const RimeModel: {
+    readonly ARCANA: "arcana";
+    readonly MIST: "mist";
+    readonly MIST_V2: "mistv2";
+};
+type RimeModel = (typeof RimeModel)[keyof typeof RimeModel];
+/** Supported response Content-Type accept headers for Rime TTS. */
+declare const RimeAudioFormat: {
+    readonly PCM: "audio/pcm";
+    readonly MP3: "audio/mp3";
+    readonly WAV: "audio/wav";
+    readonly MULAW: "audio/mulaw";
+};
+type RimeAudioFormat = (typeof RimeAudioFormat)[keyof typeof RimeAudioFormat];
+/** Constructor options for {@link RimeTTS}. */
+interface RimeTTSOptions$1 {
+    model?: string;
+    speaker?: string;
+    lang?: string;
+    sampleRate?: number;
+    repetitionPenalty?: number;
+    temperature?: number;
+    topP?: number;
+    maxTokens?: number;
+    speedAlpha?: number;
+    reduceLatency?: boolean;
+    pauseBetweenBrackets?: boolean;
+    phonemizeBetweenBrackets?: boolean;
+    baseUrl?: string;
+}
+/** Rime TTS adapter for the `users.rime.ai/v1/rime-tts` HTTP streaming endpoint. */
+declare class RimeTTS {
+    /** Stable pricing/dashboard key — read by stream-handler/metrics. */
+    static readonly providerKey = "rime";
+    private readonly apiKey;
+    private readonly model;
+    private readonly speaker;
+    private readonly lang;
+    private readonly sampleRate;
+    private readonly repetitionPenalty?;
+    private readonly temperature?;
+    private readonly topP?;
+    private readonly maxTokens?;
+    private readonly speedAlpha?;
+    private readonly reduceLatency?;
+    private readonly pauseBetweenBrackets?;
+    private readonly phonemizeBetweenBrackets?;
+    private readonly baseUrl;
+    private readonly totalTimeoutMs;
+    constructor(apiKey: string, opts?: RimeTTSOptions$1);
+    private buildPayload;
+    /** Synthesize text and return the concatenated audio buffer. */
+    synthesize(text: string): Promise<Buffer>;
+    /**
+     * Synthesize text and yield raw PCM_S16LE chunks at the configured
+     * `sampleRate` as they stream in.
+     */
+    synthesizeStream(text: string): AsyncGenerator<Buffer>;
+}
 /** Deepgram streaming STT for Patter pipeline mode. */
 type DeepgramSTTOptions = DeepgramSTTOptions$1 & {
@@ -5488,128 +5879,6 @@ declare class TTS$4 extends OpenAITTS {
     constructor(opts?: OpenAITTSOptions);
 }
-/**
- * Cartesia TTS provider — HTTP `/tts/bytes` endpoint.
- *
- * Cartesia also offers a WebSocket streaming mode with word timestamps;
- * this provider focuses on the chunked-bytes HTTP API which maps cleanly
- * onto Patter's `synthesize(text)` contract and keeps the provider
- * dependency-free (just `fetch`).
- *
- * Default model is `sonic-3` (GA snapshot `sonic-3-2026-01-12`) — Cartesia's
- * current GA model with a documented ~90 ms TTFB target. Voice IDs from the
- * sonic-2 generation (including the default Katie voice) remain compatible.
- *
- * **Telephony optimization** — the constructor default
- * `sampleRate=16000` is correct for web playback, dashboard previews, and
- * 16 kHz pipelines. For real phone calls, use the carrier-specific
- * factories instead:
- *
- * - {@link CartesiaTTS.forTwilio} requests `sampleRate=8000` natively from
- *   Cartesia. Twilio's media-stream WebSocket expects μ-law @ 8 kHz, so
- *   the SDK normally resamples 16 kHz → 8 kHz before doing the PCM →
- *   μ-law transcode in `TwilioAudioSender`. Asking Cartesia for 8 kHz
- *   PCM at the source skips the resample step (saves ~10–30 ms first-
- *   byte plus per-frame CPU and removes a potential aliasing source).
- *   The PCM → μ-law transcode still happens client-side.
- * - {@link CartesiaTTS.forTelnyx} requests `sampleRate=16000`. Telnyx
- *   negotiates L16/16000 on its bidirectional media WebSocket, so
- *   16 kHz PCM is already the format used end-to-end and no
- *   transcoding happens. This is the same as the bare-constructor
- *   default and exists for API symmetry with the Twilio factory.
- */
-/** Known Cartesia TTS models. */
-declare const CartesiaTTSModel: {
-    readonly SONIC_3: "sonic-3";
-    readonly SONIC_2: "sonic-2";
-    readonly SONIC: "sonic";
-};
-type CartesiaTTSModel = (typeof CartesiaTTSModel)[keyof typeof CartesiaTTSModel];
-/** Common PCM sample rates accepted by the Cartesia bytes endpoint. */
-declare const CartesiaTTSSampleRate: {
-    readonly HZ_8000: 8000;
-    readonly HZ_16000: 16000;
-    readonly HZ_22050: 22050;
-    readonly HZ_24000: 24000;
-    readonly HZ_44100: 44100;
-};
-type CartesiaTTSSampleRate = (typeof CartesiaTTSSampleRate)[keyof typeof CartesiaTTSSampleRate];
-/** Constructor options for {@link CartesiaTTS}. */
-interface CartesiaTTSOptions$1 {
-    model?: CartesiaTTSModel | string;
-    voice?: string;
-    language?: string;
-    sampleRate?: CartesiaTTSSampleRate | number;
-    speed?: string | number;
-    emotion?: string | string[];
-    volume?: number;
-    baseUrl?: string;
-    apiVersion?: string;
-}
-/** Cartesia TTS provider backed by the HTTP `/tts/bytes` streaming endpoint. */
-declare class CartesiaTTS {
-    /** Stable pricing/dashboard key — read by stream-handler/metrics. */
-    static readonly providerKey = "cartesia_tts";
-    private readonly apiKey;
-    private readonly model;
-    private readonly voice;
-    private readonly language;
-    private readonly sampleRate;
-    private readonly speed?;
-    private readonly emotion?;
-    private readonly volume?;
-    private readonly baseUrl;
-    private readonly apiVersion;
-    constructor(apiKey: string, opts?: CartesiaTTSOptions$1);
-    /**
-     * Construct an instance pre-configured for Twilio Media Streams.
-     *
-     * Sets `sampleRate=8000` so Cartesia emits PCM_S16LE @ 8 kHz directly.
-     * Twilio's media stream uses μ-law @ 8 kHz so the SDK still does the
-     * PCM → μ-law transcode client-side, but the 16 kHz → 8 kHz resample
-     * step is skipped. Saves ~10–30 ms first-byte plus per-frame CPU and
-     * removes a potential aliasing source.
-     */
-    static forTwilio(apiKey: string, options?: Omit<CartesiaTTSOptions$1, 'sampleRate'>): CartesiaTTS;
-    /**
-     * Construct an instance pre-configured for Telnyx bidirectional media.
-     *
-     * Sets `sampleRate=16000` to match Telnyx's L16/16000 default codec —
-     * audio flows end-to-end with zero resampling or transcoding. Same as
-     * the bare-constructor default; exists for API symmetry with
-     * {@link CartesiaTTS.forTwilio}.
-     */
-    static forTelnyx(apiKey: string, options?: Omit<CartesiaTTSOptions$1, 'sampleRate'>): CartesiaTTS;
-    /** Build the JSON payload for the Cartesia bytes endpoint. */
-    private buildPayload;
-    /**
-     * Pre-call HTTP warmup for the Cartesia `/tts/bytes` endpoint.
-     *
-     * Issues a lightweight `GET <baseUrl>/voices` so DNS, TLS, and HTTP/2
-     * are already up by the time the first `synthesizeStream()` POST
-     * lands. Best-effort: 5 s timeout, all exceptions swallowed at
-     * debug level.
-     *
-     * Billing safety: `GET /voices` is a free metadata read on
-     * Cartesia's REST surface (per https://docs.cartesia.ai). It does
-     * not consume synthesis credits. The actual synthesis is billed
-     * only when `POST /tts/bytes` runs with a non-empty `transcript`.
-     *
-     * Note: Cartesia TTS uses the HTTP path (vs the WebSocket variant
-     * Cartesia also exposes) — connection warmup is therefore HTTP-GET
-     * based, not WebSocket pre-handshake. The latency win is smaller
-     * (~50-150 ms vs the ~200-500 ms of a WS prewarm) but still real.
-     */
-    warmup(): Promise<void>;
-    /** Synthesize text and return the concatenated audio buffer. */
-    synthesize(text: string): Promise<Buffer>;
-    /**
-     * Synthesize text and yield raw PCM_S16LE chunks at the configured
-     * `sampleRate` as they arrive from Cartesia.
-     */
-    synthesizeStream(text: string): AsyncGenerator<Buffer>;
-}
 /** Cartesia TTS for Patter pipeline mode. */
 /** Constructor options for the Cartesia `TTS` adapter. */
@@ -5658,52 +5927,6 @@ declare class TTS$3 extends CartesiaTTS {
     static forTelnyx(apiKey: string, options?: Omit<CartesiaTTSOptions, "sampleRate">): TTS$3;
 }
-/** Constructor options for {@link RimeTTS}. */
-interface RimeTTSOptions$1 {
-    model?: string;
-    speaker?: string;
-    lang?: string;
-    sampleRate?: number;
-    repetitionPenalty?: number;
-    temperature?: number;
-    topP?: number;
-    maxTokens?: number;
-    speedAlpha?: number;
-    reduceLatency?: boolean;
-    pauseBetweenBrackets?: boolean;
-    phonemizeBetweenBrackets?: boolean;
-    baseUrl?: string;
-}
-/** Rime TTS adapter for the `users.rime.ai/v1/rime-tts` HTTP streaming endpoint. */
-declare class RimeTTS {
-    /** Stable pricing/dashboard key — read by stream-handler/metrics. */
-    static readonly providerKey = "rime";
-    private readonly apiKey;
-    private readonly model;
-    private readonly speaker;
-    private readonly lang;
-    private readonly sampleRate;
-    private readonly repetitionPenalty?;
-    private readonly temperature?;
-    private readonly topP?;
-    private readonly maxTokens?;
-    private readonly speedAlpha?;
-    private readonly reduceLatency?;
-    private readonly pauseBetweenBrackets?;
-    private readonly phonemizeBetweenBrackets?;
-    private readonly baseUrl;
-    private readonly totalTimeoutMs;
-    constructor(apiKey: string, opts?: RimeTTSOptions$1);
-    private buildPayload;
-    /** Synthesize text and return the concatenated audio buffer. */
-    synthesize(text: string): Promise<Buffer>;
-    /**
-     * Synthesize text and yield raw PCM_S16LE chunks at the configured
-     * `sampleRate` as they stream in.
-     */
-    synthesizeStream(text: string): AsyncGenerator<Buffer>;
-}
 /** Rime TTS for Patter pipeline mode. */
 /** Constructor options for the Rime `TTS` adapter. */
@@ -6743,6 +6966,41 @@ declare class OpenAIRealtime2Adapter extends OpenAIRealtimeAdapter {
      * output}` + `output_modalities` + `session.type === "realtime"`.
      */
     connect(): Promise<void>;
+    /**
+     * GA-API variant of {@link OpenAIRealtimeAdapter.openParkedConnection}.
+     * Opens a fresh Realtime WS against the GA endpoint, exchanges
+     * `session.created` → GA-shape `session.update` → `session.updated`
+     * so the upstream session is fully primed, and returns the OPEN
+     * socket WITHOUT taking it on `this.ws` or arming the heartbeat /
+     * message listener.
+     *
+     * Used by `Patter.parkProviderConnections` during the carrier
+     * ringing window so the per-call `StreamHandler` can adopt the
+     * primed socket at carrier `start` — eliminating the TCP + TLS +
+     * HTTP-101 + `session.update` ack round-trip from the critical path.
+     * Saves ~300-600 ms of first-audible-word latency.
+     *
+     * Bounded by 8 s. Throws on timeout / handshake failure / GA-side
+     * rejection. Callers treat any error as a cache miss and fall
+     * through to the cold {@link connect} path.
+     *
+     * Billing safety: confirmed by OpenAI's Managing Realtime Costs
+     * guide — `session.update` does NOT invoke the model and bills no
+     * tokens. An idle parked socket costs $0.
+     */
+    openParkedConnection(): Promise<WebSocket__default>;
+    /**
+     * GA-API variant of {@link OpenAIRealtimeAdapter.adoptWebSocket}. Takes
+     * over a WS that {@link openParkedConnection} produced (already through
+     * `session.created` + `session.update` + `session.updated`) and arms
+     * the heartbeat + message listener so the GA event-translation shim
+     * is wired up. Skips the cold-connect path — saves ~300-600 ms on
+     * first audible word.
+     *
+     * Caller MUST verify `ws.readyState === OPEN` before calling. If the
+     * parked WS died between park and adopt, fall back to {@link connect}.
+     */
+    adoptWebSocket(ws: WebSocket__default): void;
     /**
      * GA-API variant of {@link OpenAIRealtimeAdapter.sendFirstMessage}. Two
      * differences from the v1 path:
@@ -7430,10 +7688,18 @@ declare class TwilioAdapter {
     /** Place an outbound call. Returns the Twilio call SID. */
     initiateCall(opts: InitiateCallOptions$1): Promise<InitiateCallResult$1>;
     /**
-     * Build a minimal ``<Response><Connect><Stream url="..."/></Connect></Response>``
-     * TwiML document. Mirrors the Python adapter's ``generate_stream_twiml``.
+     * Build a ``<Response><Connect><Stream url="...">`` TwiML document.
+     *
+     * ``parameters`` is forwarded as ``<Parameter name="..." value="..."/>``
+     * children of ``<Stream>``. Twilio Media Streams strips query-string params
+     * from the ``<Stream url=...>`` before the WS handshake, so
+     * ``<Parameter>`` tags are the supported way to pre-populate
+     * ``start.customParameters`` on the WS ``start`` frame. Used by the
+     * inbound path to carry caller / callee through to the bridge.
+     *
+     * Mirrors the Python adapter's ``generate_stream_twiml``.
      */
-    static generateStreamTwiml(streamUrl: string): string;
+    static generateStreamTwiml(streamUrl: string, parameters?: Record<string, string>): string;
     /** Force-complete an in-progress call. */
     endCall(callSid: string): Promise<void>;
 }
@@ -7665,4 +7931,4 @@ interface CallEvent {
     readonly direction?: string;
 }
-export { type AgentOptions, type AgentState, AllProvidersFailedError, type AnthropicConversion, LLM$3 as AnthropicLLM, type AnthropicLLMOptions, type AnthropicMessage, AssemblyAIEncoding, AssemblyAIModel, STT$1 as AssemblyAISTT, type AssemblyAISTTOptions, type AudioConfig, type AudioSource, AuthenticationError, type BackgroundAudioOptions, BackgroundAudioPlayer, type EvaluateContext as BargeInEvaluateContext, type BargeInStrategy, BuiltinAudioClip, type BuiltinAudioClipName, type BuiltinPcmSource, type CallControl, type CallEvent, type CallEventHandler, type CallMetrics, CallMetricsAccumulator, type CallRecord, type CartesiaEncoding, STT$3 as CartesiaSTT, type CartesiaSTTOptions, TTS$3 as CartesiaTTS, type CartesiaTTSOptions, LLM$1 as CerebrasLLM, type CerebrasLLMOptions, ChatContext, type ChatMessage, type ChatRole, CloudflareTunnel, type ConversationStateSnapshot, type CostBreakdown, DEFAULT_MIN_SENTENCE_LEN, DEFAULT_PRICING, DTMF_EVENTS, DeepFilterNetFilter, type DeepFilterNetOptions, STT$6 as DeepgramSTT, type DeepgramSTTOptions, DefaultToolExecutor, type DefaultToolExecutorOptions, type DefineToolInput, type DtmfEvent, ConvAI as ElevenLabsConvAI, ElevenLabsConvAIAdapter, type ConvAIOptions as ElevenLabsConvAIOptions, ElevenLabsTTS as ElevenLabsRestTTS, TTS$6 as ElevenLabsTTS, type ElevenLabsTTSOptions, type ElevenLabsWebSocketOptions, TTS$5 as ElevenLabsWebSocketTTS, type EouTrigger, ErrorCode, EventBus, FallbackLLMProvider, type FallbackLLMProviderOptions, type FilePcmSource, GEMINI_DEFAULT_INPUT_SR, GEMINI_DEFAULT_OUTPUT_SR, GeminiLiveAdapter, type GeminiLiveEventHandler, LLM as GoogleLLM, type GoogleLLMOptions, LLM$2 as GroqLLM, type GroqLLMOptions, Guardrail$1 as Guardrail, type GuardrailOptions, type HookContext, IVRActivity, type IVRActivityOptions, type IVRToolDefinition, type IncomingMessage, type InitTracingOptions, TTS as InworldTTS, type InworldTTSOptions, type JobCallback, KrispFrameDuration, KrispSampleRate, KrispVivaFilter, type 
KrispVivaFilterOptions, type LLMChunk, LLMLoop, type LLMProvider, LMNTAudioFormat, LMNTModel, LMNTSampleRate, TTS$1 as LMNTTTS, type LMNTTTSOptions, type LatencyBreakdown, type LocalCallOptions, type LocalConfig, type LocalOptions, type Logger, type LoopCallback, type MessageHandler, MetricsStore, MinWordsStrategy, type MinWordsStrategyOptions, Ngrok, LLM$4 as OpenAILLM, type OpenAILLMOptions, OpenAILLMProvider, type OpenAIMessage, Realtime as OpenAIRealtime, Realtime2 as OpenAIRealtime2, OpenAIRealtime2Adapter, type Realtime2Options as OpenAIRealtime2Options, OpenAIRealtimeAdapter, type RealtimeOptions as OpenAIRealtimeOptions, TTS$4 as OpenAITTS, type OpenAITTSOptions, STT$4 as OpenAITranscribeSTT, type OpenAITranscribeSTTOptions, type ParamSpec, PartialStreamError, Patter, PatterConnectionError, PatterError, type PatterEventType, PatterTool, type PatterToolExecuteArgs, type PatterToolOptions, type PatterToolResult, PcmCarry, PipelineHookExecutor, type PipelineHooks, type PipelineMessageHandler, type ProviderPricing, ProvisionError, RateLimitError, type RawPcmSource, type RealtimeConfig, RemoteMessageHandler, TTS$2 as RimeTTS, type RimeTTSOptions, SPAN_BARGEIN, SPAN_CALL, SPAN_ENDPOINT, SPAN_LLM, SPAN_STT, SPAN_TOOL, SPAN_TTS, type SSEEvent, type STTConfig, type ScheduleHandle, SentenceChunker, type ServeOptions, type SilenceCallback, type SileroSampleRate, SileroVAD, type SileroVADOptions, STT$2 as SonioxSTT, type SonioxSTTOptions$1 as SonioxSTTOptions, type Span, type SpeechEventCallback, SpeechEvents, SpeechmaticsAudioEncoding, SpeechmaticsOperatingPoint, STT as SpeechmaticsSTT, type SpeechmaticsSTTOptions, SpeechmaticsSampleRate, SpeechmaticsServerMessage, TurnDetectionMode as SpeechmaticsTurnDetectionMode, StatefulResampler, type StatefulResamplerOptions, Static as StaticTunnel, type TTSConfig, Carrier as Telnyx, TelnyxAdapter, type TelnyxCarrierOptions, type ConfigureNumberOptions as TelnyxConfigureNumberOptions, type EndCallOptions as TelnyxEndCallOptions, 
type InitiateCallOptions as TelnyxInitiateCallOptions, type InitiateCallResult as TelnyxInitiateCallResult, type ProvisionNumberOptions as TelnyxProvisionNumberOptions, type ProvisionNumberResult as TelnyxProvisionNumberResult, TelnyxSTT, TelnyxSTTInputFormat, TelnyxSTTSampleRate, type Transcript as TelnyxSTTTranscript, TelnyxTTS, TelnyxTTSSampleRate, TelnyxTTSVoice, type TelnyxTranscriptionEngine, TestSession, TfidfLoopDetector, type TfidfLoopDetectorOptions, Tool, type ToolDefinition, type ToolExecutor, type ToolHandler, type ToolOptions, type TunnelHandle, type TurnMetrics, Carrier$1 as Twilio, TwilioAdapter, type TwilioAdapterOptions, type TwilioCarrierOptions, type ConfigureNumberOptions$1 as TwilioConfigureNumberOptions, type InitiateCallOptions$1 as TwilioInitiateCallOptions, type InitiateCallResult$1 as TwilioInitiateCallResult, type ProvisionNumberOptions$1 as TwilioProvisionNumberOptions, type ProvisionNumberResult$1 as TwilioProvisionNumberResult, ULTRAVOX_DEFAULT_API_BASE, ULTRAVOX_DEFAULT_SR, type UltravoxEventHandler, UltravoxRealtimeAdapter, type UserState, STT$5 as WhisperSTT, type WhisperSTTOptions, assemblyai, builtinClipPath, calculateRealtimeCost, calculateSttCost, calculateTelephonyCost, calculateTtsCost, callsToCsv, callsToJson, cartesia, createResampler16kTo8k, createResampler24kTo16k, createResampler24kTo8k, createResampler8kTo16k, deepgram, defineTool, elevenlabs, evaluateStrategies as evaluateBargeInStrategies, filterEmoji, filterForTTS, filterMarkdown, formatDtmf, geminiLive, getLogger, guardrail, initTracing, isRemoteUrl, isTracingEnabled, isWebSocketUrl, lmnt, makeAuthMiddleware, mergePricing, mixPcm, mountApi, mountDashboard, mulawToPcm16, notifyDashboard, openaiTts, pcm16ToMulaw, resample16kTo8k, resample24kTo16k, resample8kTo16k, resamplePcm, resetStrategies as resetBargeInStrategies, rime, scheduleCron, scheduleInterval, scheduleOnce, selectSoundFromList, setLogger, soniox, speechmatics, startSpan, startTunnel, tool, ultravox, 
whisper };
+export { type AgentOptions, type AgentState, AllProvidersFailedError, type AnthropicConversion, LLM$3 as AnthropicLLM, type AnthropicLLMOptions, type AnthropicMessage, AssemblyAIEncoding, AssemblyAIModel, STT$1 as AssemblyAISTT, type AssemblyAISTTOptions, type AudioConfig, type AudioSource, AuthenticationError, type BackgroundAudioOptions, BackgroundAudioPlayer, type EvaluateContext as BargeInEvaluateContext, type BargeInStrategy, BuiltinAudioClip, type BuiltinAudioClipName, type BuiltinPcmSource, type CallControl, type CallEvent, type CallEventHandler, type CallMetrics, CallMetricsAccumulator, type CallRecord, type CartesiaEncoding, STT$3 as CartesiaSTT, type CartesiaSTTOptions, TTS$3 as CartesiaTTS, CartesiaTTSModel, type CartesiaTTSOptions, CartesiaTTSVoiceMode, LLM$1 as CerebrasLLM, type CerebrasLLMOptions, ChatContext, type ChatMessage, type ChatRole, CloudflareTunnel, type ConversationStateSnapshot, type CostBreakdown, DEFAULT_MIN_SENTENCE_LEN, DEFAULT_PRICING, DTMF_EVENTS, DeepFilterNetFilter, type DeepFilterNetOptions, DeepgramModel, STT$6 as DeepgramSTT, type DeepgramSTTOptions, DefaultToolExecutor, type DefaultToolExecutorOptions, type DefineToolInput, type DtmfEvent, ConvAI as ElevenLabsConvAI, ElevenLabsConvAIAdapter, type ConvAIOptions as ElevenLabsConvAIOptions, ElevenLabsModel, ElevenLabsOutputFormat, ElevenLabsTTS as ElevenLabsRestTTS, TTS$6 as ElevenLabsTTS, type ElevenLabsTTSOptions, type ElevenLabsWebSocketOptions, TTS$5 as ElevenLabsWebSocketTTS, type EouTrigger, ErrorCode, EventBus, FallbackLLMProvider, type FallbackLLMProviderOptions, type FilePcmSource, GEMINI_DEFAULT_INPUT_SR, GEMINI_DEFAULT_OUTPUT_SR, GeminiLiveAdapter, type GeminiLiveEventHandler, LLM as GoogleLLM, type GoogleLLMOptions, LLM$2 as GroqLLM, type GroqLLMOptions, Guardrail$1 as Guardrail, type GuardrailOptions, type HookContext, IVRActivity, type IVRActivityOptions, type IVRToolDefinition, type IncomingMessage, type InitTracingOptions, TTS as InworldTTS, type 
InworldTTSOptions, type JobCallback, KrispFrameDuration, KrispSampleRate, KrispVivaFilter, type KrispVivaFilterOptions, type LLMChunk, LLMLoop, type LLMProvider, LMNTAudioFormat, LMNTModel, LMNTSampleRate, TTS$1 as LMNTTTS, type LMNTTTSOptions, type LatencyBreakdown, type LocalCallOptions, type LocalConfig, type LocalOptions, type Logger, type LoopCallback, type MessageHandler, MetricsStore, MinWordsStrategy, type MinWordsStrategyOptions, type ModelPricing, Ngrok, LLM$4 as OpenAILLM, type OpenAILLMOptions, OpenAILLMProvider, type OpenAIMessage, Realtime as OpenAIRealtime, Realtime2 as OpenAIRealtime2, OpenAIRealtime2Adapter, type Realtime2Options as OpenAIRealtime2Options, OpenAIRealtimeAdapter, OpenAIRealtimeAudioFormat, OpenAIRealtimeModel, type RealtimeOptions as OpenAIRealtimeOptions, OpenAIRealtimeVADType, TTS$4 as OpenAITTS, type OpenAITTSOptions, STT$4 as OpenAITranscribeSTT, type OpenAITranscribeSTTOptions, OpenAITranscriptionModel, OpenAIVoice, PRICING_LAST_UPDATED, PRICING_VERSION, type ParamSpec, PartialStreamError, Patter, PatterConnectionError, PatterError, type PatterEventType, PatterTool, type PatterToolExecuteArgs, type PatterToolOptions, type PatterToolResult, PcmCarry, PipelineHookExecutor, type PipelineHooks, type PipelineMessageHandler, PricingUnit, type PricingUnitValue, type ProviderPricing, ProvisionError, RateLimitError, type RawPcmSource, type RealtimeConfig, RemoteMessageHandler, RimeAudioFormat, RimeModel, TTS$2 as RimeTTS, type RimeTTSOptions, SPAN_BARGEIN, SPAN_CALL, SPAN_ENDPOINT, SPAN_LLM, SPAN_STT, SPAN_TOOL, SPAN_TTS, type SSEEvent, type STTConfig, type ScheduleHandle, SentenceChunker, type ServeOptions, type SilenceCallback, type SileroSampleRate, SileroVAD, type SileroVADOptions, STT$2 as SonioxSTT, type SonioxSTTOptions$1 as SonioxSTTOptions, type Span, type SpeechEventCallback, SpeechEvents, SpeechmaticsAudioEncoding, SpeechmaticsOperatingPoint, STT as SpeechmaticsSTT, type SpeechmaticsSTTOptions, SpeechmaticsSampleRate, 
SpeechmaticsServerMessage, TurnDetectionMode as SpeechmaticsTurnDetectionMode, StatefulResampler, type StatefulResamplerOptions, Static as StaticTunnel, type TTSConfig, Carrier as Telnyx, TelnyxAdapter, type TelnyxCarrierOptions, type ConfigureNumberOptions as TelnyxConfigureNumberOptions, type EndCallOptions as TelnyxEndCallOptions, type InitiateCallOptions as TelnyxInitiateCallOptions, type InitiateCallResult as TelnyxInitiateCallResult, type ProvisionNumberOptions as TelnyxProvisionNumberOptions, type ProvisionNumberResult as TelnyxProvisionNumberResult, TelnyxSTT, TelnyxSTTInputFormat, TelnyxSTTSampleRate, type Transcript as TelnyxSTTTranscript, TelnyxTTS, TelnyxTTSSampleRate, TelnyxTTSVoice, type TelnyxTranscriptionEngine, TestSession, TfidfLoopDetector, type TfidfLoopDetectorOptions, Tool, type ToolDefinition, type ToolExecutor, type ToolHandler, type ToolOptions, type TunnelHandle, type TurnMetrics, Carrier$1 as Twilio, TwilioAdapter, type TwilioAdapterOptions, type TwilioCarrierOptions, type ConfigureNumberOptions$1 as TwilioConfigureNumberOptions, type InitiateCallOptions$1 as TwilioInitiateCallOptions, type InitiateCallResult$1 as TwilioInitiateCallResult, type ProvisionNumberOptions$1 as TwilioProvisionNumberOptions, type ProvisionNumberResult$1 as TwilioProvisionNumberResult, ULTRAVOX_DEFAULT_API_BASE, ULTRAVOX_DEFAULT_SR, type UltravoxEventHandler, UltravoxRealtimeAdapter, type UserState, STT$5 as WhisperSTT, type WhisperSTTOptions, assemblyai, builtinClipPath, calculateRealtimeCost, calculateSttCost, calculateTelephonyCost, calculateTtsCost, callsToCsv, callsToJson, cartesia, createResampler16kTo8k, createResampler24kTo16k, createResampler24kTo8k, createResampler8kTo16k, deepgram, defineTool, elevenlabs, evaluateStrategies as evaluateBargeInStrategies, filterEmoji, filterForTTS, filterMarkdown, formatDtmf, geminiLive, getLogger, guardrail, initTracing, isRemoteUrl, isTracingEnabled, isWebSocketUrl, lmnt, makeAuthMiddleware, mergePricing, mixPcm, 
mountApi, mountDashboard, mulawToPcm16, notifyDashboard, openaiTts, pcm16ToMulaw, resample16kTo8k, resample24kTo16k, resample8kTo16k, resamplePcm, resetStrategies as resetBargeInStrategies, rime, scheduleCron, scheduleInterval, scheduleOnce, selectSoundFromList, setLogger, soniox, speechmatics, startSpan, startTunnel, tool, ultravox, whisper };