npm - @hivegpt/hiveai-angular - Versions diffs - 0.0.583 → 0.0.584 - Mend

@hivegpt/hiveai-angular 0.0.583 → 0.0.584

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (20)

package/fesm2015/hivegpt-hiveai-angular.js — CHANGED

@@ -5,14 +5,16 @@ import { HttpClient, HttpHeaders } from '@angular/common/http';
 import * as i0 from '@angular/core';
 import { Injectable, InjectionToken, Inject, PLATFORM_ID, Optional, NgZone, EventEmitter, Component, Injector, Output, Input, ElementRef, ChangeDetectionStrategy, ChangeDetectorRef, Renderer2, ViewContainerRef, ViewChild, ViewChildren, NgModule, Pipe } from '@angular/core';
 import { DomSanitizer } from '@angular/platform-browser';
-import { BehaviorSubject, of, throwError, Subject, Subscription, merge, concat, timer, combineLatest } from 'rxjs';
-import { switchMap, catchError, filter, take, map, takeUntil, distinctUntilChanged, startWith, tap } from 'rxjs/operators';
+import { BehaviorSubject, of, throwError, Subject, Subscription } from 'rxjs';
+import { switchMap, catchError, filter, take, map, tap } from 'rxjs/operators';
 import { isPlatformBrowser, CommonModule, DOCUMENT } from '@angular/common';
 import { Socket } from 'ngx-socket-io';
 import { Validators, FormBuilder, FormsModule, ReactiveFormsModule } from '@angular/forms';
 import * as SpeechSDK from 'microsoft-cognitiveservices-speech-sdk';
 import * as marked from 'marked';
 import { __awaiter } from 'tslib';
+import { PipecatClient, RTVIEvent } from '@pipecat-ai/client-js';
+import { WebSocketTransport } from '@pipecat-ai/websocket-transport';
 import { MatIconModule } from '@angular/material/icon';
 import { MatSidenavModule } from '@angular/material/sidenav';
 import { QuillModule } from 'ngx-quill';
@@ -805,219 +807,23 @@ AudioAnalyzerService.decorators = [
 ];
 /**
- * Native WebSocket client for voice session (signaling, transcripts, speaking hints).
- * CRITICAL: Uses native WebSocket only. NO Socket.IO, NO ngx-socket-io.
+ * Voice agent orchestrator using the official PipecatClient SDK.
  *
- * Connects to `ws_url` from `POST {baseUrl}/ai/ask-voice-socket`.
- * Parses JSON messages for transcripts and optional assistant/user speaking flags.
- */
-class WebSocketVoiceClientService {
-    constructor(ngZone) {
-        this.ngZone = ngZone;
-        this.ws = null;
-        /** True when {@link disconnect} initiated the close (not counted as remote close). */
-        this.closeInitiatedByClient = false;
-        this.openedSubject = new Subject();
-        this.remoteCloseSubject = new Subject();
-        this.userTranscriptSubject = new Subject();
-        this.botTranscriptSubject = new Subject();
-        this.assistantSpeakingSubject = new Subject();
-        this.serverUserSpeakingSubject = new Subject();
-        this.audioChunkSubject = new Subject();
-        /** Fires once each time the WebSocket reaches OPEN. */
-        this.opened$ = this.openedSubject.asObservable();
-        /** Fires when the socket closes without a client-initiated {@link disconnect}. */
-        this.remoteClose$ = this.remoteCloseSubject.asObservable();
-        this.userTranscript$ = this.userTranscriptSubject.asObservable();
-        this.botTranscript$ = this.botTranscriptSubject.asObservable();
-        /** Assistant/bot speaking, when the server sends explicit events (see {@link handleJsonMessage}). */
-        this.assistantSpeaking$ = this.assistantSpeakingSubject.asObservable();
-        /** User speaking from server-side VAD, if provided. */
-        this.serverUserSpeaking$ = this.serverUserSpeakingSubject.asObservable();
-        /** Binary audio frames from server (when backend streams bot audio over WS). */
-        this.audioChunk$ = this.audioChunkSubject.asObservable();
-    }
-    connect(wsUrl) {
-        var _a;
-        if (((_a = this.ws) === null || _a === void 0 ? void 0 : _a.readyState) === WebSocket.OPEN) {
-            return;
-        }
-        if (this.ws) {
-            this.closeInitiatedByClient = true;
-            this.ws.close();
-        }
-        try {
-            const socket = new WebSocket(wsUrl);
-            this.ws = socket;
-            socket.onopen = () => {
-                if (this.ws !== socket)
-                    return;
-                this.ngZone.run(() => this.openedSubject.next());
-            };
-            socket.onmessage = (event) => {
-                if (this.ws !== socket)
-                    return;
-                void this.handleIncomingMessage(event.data);
-            };
-            socket.onerror = () => {
-                this.ngZone.run(() => {
-                    if (this.ws === socket && socket.readyState !== WebSocket.CLOSED) {
-                        socket.close();
-                    }
-                });
-            };
-            socket.onclose = () => {
-                if (this.ws === socket) {
-                    this.ws = null;
-                }
-                const client = this.closeInitiatedByClient;
-                this.closeInitiatedByClient = false;
-                if (!client) {
-                    this.ngZone.run(() => this.remoteCloseSubject.next());
-                }
-            };
-        }
-        catch (err) {
-            console.error('WebSocketVoiceClient: connect failed', err);
-            this.ws = null;
-            throw err;
-        }
-    }
-    handleIncomingMessage(payload) {
-        return __awaiter(this, void 0, void 0, function* () {
-            if (typeof payload === 'string') {
-                this.handleJsonString(payload);
-                return;
-            }
-            if (payload instanceof ArrayBuffer) {
-                this.handleBinaryMessage(payload);
-                return;
-            }
-            if (payload instanceof Blob) {
-                const ab = yield payload.arrayBuffer();
-                this.handleBinaryMessage(ab);
-            }
-        });
-    }
-    handleJsonString(jsonText) {
-        try {
-            const msg = JSON.parse(jsonText);
-            this.ngZone.run(() => this.handleJsonMessage(msg));
-        }
-        catch (_a) {
-            // Ignore non-JSON
-        }
-    }
-    handleBinaryMessage(buffer) {
-        // Some backends wrap JSON events inside binary WS frames.
-        const maybeText = this.tryDecodeUtf8(buffer);
-        if (maybeText !== null) {
-            this.handleJsonString(maybeText);
-            return;
-        }
-        // Otherwise treat binary as streamed assistant audio.
-        this.ngZone.run(() => this.audioChunkSubject.next(buffer));
-    }
-    tryDecodeUtf8(buffer) {
-        try {
-            const text = new TextDecoder('utf-8', { fatal: true }).decode(buffer);
-            const trimmed = text.trim();
-            if (!trimmed || (trimmed[0] !== '{' && trimmed[0] !== '[')) {
-                return null;
-            }
-            return trimmed;
-        }
-        catch (_a) {
-            return null;
-        }
-    }
-    handleJsonMessage(msg) {
-        const type = msg.type;
-        const typeStr = typeof type === 'string' ? type : '';
-        if (typeStr === 'session_ready' || typeStr === 'connected' || typeStr === 'voice_session_started') {
-            return;
-        }
-        if (typeStr === 'assistant_speaking' ||
-            typeStr === 'bot_speaking') {
-            if (msg.active === true || msg.speaking === true) {
-                this.assistantSpeakingSubject.next(true);
-            }
-            else if (msg.active === false || msg.speaking === false) {
-                this.assistantSpeakingSubject.next(false);
-            }
-            return;
-        }
-        if (typeStr === 'user_speaking') {
-            if (msg.active === true || msg.speaking === true) {
-                this.serverUserSpeakingSubject.next(true);
-            }
-            else if (msg.active === false || msg.speaking === false) {
-                this.serverUserSpeakingSubject.next(false);
-            }
-            return;
-        }
-        if (typeStr === 'input_audio_buffer.speech_started') {
-            this.serverUserSpeakingSubject.next(true);
-            return;
-        }
-        if (typeStr === 'input_audio_buffer.speech_stopped') {
-            this.serverUserSpeakingSubject.next(false);
-            return;
-        }
-        if (typeStr === 'response.audio.delta') {
-            this.assistantSpeakingSubject.next(true);
-            return;
-        }
-        if (typeStr === 'response.audio.done' ||
-            typeStr === 'response.output_audio.done') {
-            this.assistantSpeakingSubject.next(false);
-            return;
-        }
-        if (typeStr === 'user_transcript' && typeof msg.text === 'string') {
-            this.userTranscriptSubject.next({
-                text: msg.text,
-                final: msg.final === true,
-            });
-            return;
-        }
-        if (typeStr === 'bot_transcript' && typeof msg.text === 'string') {
-            this.botTranscriptSubject.next(msg.text);
-        }
-    }
-    disconnect() {
-        if (!this.ws) {
-            return;
-        }
-        this.closeInitiatedByClient = true;
-        this.ws.close();
-    }
-    get isConnected() {
-        var _a;
-        return ((_a = this.ws) === null || _a === void 0 ? void 0 : _a.readyState) === WebSocket.OPEN;
-    }
-}
-WebSocketVoiceClientService.ɵprov = i0.ɵɵdefineInjectable({ factory: function WebSocketVoiceClientService_Factory() { return new WebSocketVoiceClientService(i0.ɵɵinject(i0.NgZone)); }, token: WebSocketVoiceClientService, providedIn: "root" });
-WebSocketVoiceClientService.decorators = [
-    { type: Injectable, args: [{
-                providedIn: 'root',
-            },] }
-];
-WebSocketVoiceClientService.ctorParameters = () => [
-    { type: NgZone }
-];
-/**
- * Voice agent orchestrator: single WebSocket (`ws_url` from POST /ai/ask-voice-socket)
- * for session events, transcripts, and optional speaking hints; local mic for capture
- * and waveform only (no Daily/WebRTC room).
+ * Audio flow (mirrors the React reference implementation):
+ *  - Local mic: acquired by PipecatClient.initDevices(); local track fed to
+ *    AudioAnalyzerService for waveform visualisation.
+ *  - Bot audio: received as a MediaStreamTrack via RTVIEvent.TrackStarted,
+ *    played through a hidden <audio> element.
+ *  - All binary protobuf framing / RTVI protocol handled by
+ *    @pipecat-ai/client-js + @pipecat-ai/websocket-transport.
  */
 class VoiceAgentService {
-    constructor(audioAnalyzer, wsClient, platformTokenRefresh,
+    constructor(audioAnalyzer, platformTokenRefresh, ngZone,
     /** `Object` not `object` — ngc metadata collection rejects the `object` type in DI params. */
     platformId) {
         this.audioAnalyzer = audioAnalyzer;
-        this.wsClient = wsClient;
         this.platformTokenRefresh = platformTokenRefresh;
+        this.ngZone = ngZone;
         this.platformId = platformId;
         this.callStateSubject = new BehaviorSubject('idle');
         this.statusTextSubject = new BehaviorSubject('');
@@ -1029,11 +835,8 @@ class VoiceAgentService {
         this.botTranscriptSubject = new Subject();
         this.callStartTime = 0;
         this.durationInterval = null;
-        this.localMicStream = null;
-        this.remoteAudioContext = null;
-        this.pendingRemoteAudio = [];
-        this.remoteAudioPlaying = false;
-        this.endCall$ = new Subject();
+        this.pcClient = null;
+        this.botAudioElement = null;
         this.subscriptions = new Subscription();
         this.destroy$ = new Subject();
         this.callState$ = this.callStateSubject.asObservable();
@@ -1045,29 +848,17 @@ class VoiceAgentService {
         this.userTranscript$ = this.userTranscriptSubject.asObservable();
         this.botTranscript$ = this.botTranscriptSubject.asObservable();
         this.subscriptions.add(this.audioAnalyzer.audioLevels$.subscribe((levels) => this.audioLevelsSubject.next(levels)));
-        this.subscriptions.add(this.wsClient.remoteClose$
-            .pipe(takeUntil(this.destroy$))
-            .subscribe(() => void this.handleRemoteClose()));
-        this.subscriptions.add(this.wsClient.audioChunk$
-            .pipe(takeUntil(this.destroy$))
-            .subscribe((chunk) => this.enqueueRemoteAudio(chunk)));
     }
     ngOnDestroy() {
         this.destroy$.next();
         this.subscriptions.unsubscribe();
-        this.disconnect();
+        void this.disconnect();
     }
-    /** Reset to idle state (e.g. when modal opens so user can click Start Call). */
+    /** Reset to idle (e.g. when modal re-opens so user can click Start Call). */
     resetToIdle() {
         if (this.callStateSubject.value === 'idle')
             return;
-        this.endCall$.next();
-        this.stopDurationTimer();
-        this.callStartTime = 0;
-        this.audioAnalyzer.stop();
-        this.stopLocalMic();
-        this.resetRemoteAudioPlayback();
-        this.wsClient.disconnect();
+        void this.disconnect();
         this.callStateSubject.next('idle');
         this.statusTextSubject.next('');
         this.durationSubject.next('0:00');
@@ -1075,7 +866,7 @@ class VoiceAgentService {
     connect(apiUrl, token, botId, conversationId, apiKey, eventToken, eventId, eventUrl, domainAuthority, usersApiUrl) {
         return __awaiter(this, void 0, void 0, function* () {
             if (this.callStateSubject.value !== 'idle') {
-                console.warn('Call already in progress');
+                console.warn('[HiveGpt Voice] Call already in progress');
                 return;
             }
             try {
@@ -1088,257 +879,196 @@ class VoiceAgentService {
                             .ensureValidAccessToken(token, usersApiUrl)
                             .pipe(take(1))
                             .toPromise();
-                        if (ensured === null || ensured === void 0 ? void 0 : ensured.accessToken) {
+                        if (ensured === null || ensured === void 0 ? void 0 : ensured.accessToken)
                             accessToken = ensured.accessToken;
-                        }
                     }
                     catch (e) {
-                        console.warn('[HiveGpt Voice] Token refresh before connect failed', e);
+                        console.warn('[HiveGpt Voice] Token refresh failed', e);
                     }
                 }
                 const baseUrl = apiUrl.replace(/\/$/, '');
-                const postUrl = `${baseUrl}/ai/ask-voice-socket`;
-                const headers = {
-                    'Content-Type': 'application/json',
-                    Authorization: `Bearer ${accessToken}`,
-                    'x-api-key': apiKey,
-                    'hive-bot-id': botId,
-                    'domain-authority': domainAuthority,
-                    eventUrl,
-                    eventId,
-                    eventToken,
-                    'ngrok-skip-browser-warning': 'true',
-                };
-                const res = yield fetch(postUrl, {
-                    method: 'POST',
-                    headers,
-                    body: JSON.stringify({
+                const pcClient = new PipecatClient({
+                    transport: new WebSocketTransport(),
+                    enableMic: true,
+                    enableCam: false,
+                    callbacks: {
+                        onConnected: () => this.ngZone.run(() => this.onPipecatConnected()),
+                        onDisconnected: () => this.ngZone.run(() => this.onPipecatDisconnected()),
+                        onBotReady: () => this.ngZone.run(() => this.onBotReady()),
+                        onUserTranscript: (data) => this.ngZone.run(() => this.userTranscriptSubject.next({ text: data.text, final: !!data.final })),
+                        onBotTranscript: (data) => this.ngZone.run(() => this.botTranscriptSubject.next(data.text)),
+                        onError: (err) => {
+                            this.ngZone.run(() => {
+                                console.error('[HiveGpt Voice] PipecatClient error', err);
+                                this.callStateSubject.next('ended');
+                                this.statusTextSubject.next('Connection failed');
+                            });
+                        },
+                    },
+                });
+                this.pcClient = pcClient;
+                // Bot audio arrives as a MediaStreamTrack — wire to a hidden <audio> element
+                pcClient.on(RTVIEvent.TrackStarted, (track, participant) => {
+                    if (!(participant === null || participant === void 0 ? void 0 : participant.local) && track.kind === 'audio') {
+                        this.ngZone.run(() => this.setupBotAudioTrack(track));
+                    }
+                });
+                // Speaking state comes straight from RTVI events
+                pcClient.on(RTVIEvent.BotStartedSpeaking, () => this.ngZone.run(() => this.onBotStartedSpeaking()));
+                pcClient.on(RTVIEvent.BotStoppedSpeaking, () => this.ngZone.run(() => this.onBotStoppedSpeaking()));
+                pcClient.on(RTVIEvent.UserStartedSpeaking, () => this.ngZone.run(() => {
+                    this.isUserSpeakingSubject.next(true);
+                    this.callStateSubject.next('listening');
+                }));
+                pcClient.on(RTVIEvent.UserStoppedSpeaking, () => this.ngZone.run(() => {
+                    this.isUserSpeakingSubject.next(false);
+                    if (this.callStateSubject.value === 'listening') {
+                        this.callStateSubject.next('connected');
+                    }
+                }));
+                // Acquire mic (triggers browser permission prompt)
+                yield pcClient.initDevices();
+                // Build headers using the browser Headers API (required by pipecat's APIRequest type)
+                const requestHeaders = new Headers();
+                requestHeaders.append('Authorization', `Bearer ${accessToken}`);
+                requestHeaders.append('x-api-key', apiKey);
+                requestHeaders.append('hive-bot-id', botId);
+                requestHeaders.append('domain-authority', domainAuthority);
+                requestHeaders.append('eventUrl', eventUrl);
+                requestHeaders.append('eventId', eventId);
+                requestHeaders.append('eventToken', eventToken);
+                requestHeaders.append('ngrok-skip-browser-warning', 'true');
+                // POST to /ai/ask-voice-socket → receives { ws_url } → WebSocketTransport connects
+                yield pcClient.startBotAndConnect({
+                    endpoint: `${baseUrl}/ai/ask-voice-socket`,
+                    headers: requestHeaders,
+                    requestData: {
                         bot_id: botId,
                         conversation_id: conversationId,
                         voice: 'alloy',
-                    }),
+                    },
                 });
-                if (!res.ok) {
-                    throw new Error(`HTTP ${res.status}`);
-                }
-                const json = yield res.json();
-                const wsUrl = (typeof (json === null || json === void 0 ? void 0 : json.ws_url) === 'string' && json.ws_url) ||
-                    (typeof (json === null || json === void 0 ? void 0 : json.rn_ws_url) === 'string' && json.rn_ws_url);
-                if (!wsUrl) {
-                    throw new Error('No ws_url in response');
-                }
-                const untilCallEnds$ = merge(this.destroy$, this.endCall$);
-                this.subscriptions.add(this.wsClient.userTranscript$
-                    .pipe(takeUntil(untilCallEnds$))
-                    .subscribe((t) => this.userTranscriptSubject.next(t)));
-                this.subscriptions.add(this.wsClient.botTranscript$
-                    .pipe(takeUntil(untilCallEnds$))
-                    .subscribe((t) => this.botTranscriptSubject.next(t)));
-                this.subscriptions.add(this.wsClient.opened$
-                    .pipe(takeUntil(untilCallEnds$), take(1))
-                    .subscribe(() => void this.onWebsocketOpened()));
-                this.wsClient.connect(wsUrl);
             }
             catch (error) {
-                console.error('Error connecting voice agent:', error);
+                console.error('[HiveGpt Voice] connect failed', error);
                 this.callStateSubject.next('ended');
-                yield this.disconnect();
+                yield this.cleanupPipecatClient();
                 this.statusTextSubject.next('Connection failed');
                 throw error;
             }
         });
     }
-    onWebsocketOpened() {
-        return __awaiter(this, void 0, void 0, function* () {
-            if (this.callStateSubject.value !== 'connecting') {
-                return;
-            }
-            try {
-                yield this.startLocalMic();
-                this.statusTextSubject.next('Connected');
-                this.callStateSubject.next('connected');
-                this.wireSpeakingState();
-            }
-            catch (err) {
-                console.error('[HiveGpt Voice] Mic or session setup failed', err);
-                this.callStateSubject.next('ended');
-                this.statusTextSubject.next('Microphone unavailable');
-                yield this.disconnect();
-            }
-        });
-    }
-    wireSpeakingState() {
-        const untilCallEnds$ = merge(this.destroy$, this.endCall$);
-        const transcriptDrivenAssistant$ = this.wsClient.botTranscript$.pipe(switchMap(() => concat(of(true), timer(800).pipe(map(() => false)))), distinctUntilChanged());
-        const assistantTalking$ = merge(this.wsClient.assistantSpeaking$, transcriptDrivenAssistant$).pipe(distinctUntilChanged(), startWith(false));
-        const userTalking$ = combineLatest([
-            this.audioAnalyzer.isUserSpeaking$,
-            this.wsClient.serverUserSpeaking$.pipe(startWith(false)),
-        ]).pipe(map(([local, server]) => local || server), distinctUntilChanged(), startWith(false));
-        this.subscriptions.add(combineLatest([assistantTalking$, userTalking$])
-            .pipe(takeUntil(untilCallEnds$))
-            .subscribe(([bot, user]) => {
-            const current = this.callStateSubject.value;
-            if (user) {
-                this.isUserSpeakingSubject.next(true);
-                this.callStateSubject.next('listening');
-            }
-            else {
-                this.isUserSpeakingSubject.next(false);
-            }
-            if (user) {
-                return;
-            }
-            if (bot) {
-                if (this.callStartTime === 0) {
-                    this.callStartTime = Date.now();
-                    this.startDurationTimer();
-                }
-                this.callStateSubject.next('talking');
-            }
-            else if (current === 'talking' || current === 'listening') {
-                this.callStateSubject.next('connected');
-            }
-        }));
+    onPipecatConnected() {
+        this.callStateSubject.next('connected');
+        this.statusTextSubject.next('Connected');
+        this.isMicMutedSubject.next(false);
+        this.startLocalMicAnalyzer();
     }
-    startLocalMic() {
-        return __awaiter(this, void 0, void 0, function* () {
-            this.stopLocalMic();
-            const stream = yield navigator.mediaDevices.getUserMedia({ audio: true });
-            const track = stream.getAudioTracks()[0];
-            if (!track) {
-                stream.getTracks().forEach((t) => t.stop());
-                throw new Error('No audio track');
-            }
-            this.localMicStream = stream;
-            this.isMicMutedSubject.next(!track.enabled);
-            this.audioAnalyzer.start(stream);
-        });
-    }
-    stopLocalMic() {
-        if (this.localMicStream) {
-            this.localMicStream.getTracks().forEach((t) => t.stop());
-            this.localMicStream = null;
-        }
-    }
-    enqueueRemoteAudio(chunk) {
-        this.pendingRemoteAudio.push(chunk.slice(0));
-        if (!this.remoteAudioPlaying) {
-            void this.playRemoteAudioQueue();
-        }
+    onPipecatDisconnected() {
+        this.stopDurationTimer();
+        this.callStartTime = 0;
+        this.audioAnalyzer.stop();
+        this.stopBotAudio();
+        this.callStateSubject.next('ended');
+        this.statusTextSubject.next('Call Ended');
     }
-    playRemoteAudioQueue() {
-        return __awaiter(this, void 0, void 0, function* () {
-            this.remoteAudioPlaying = true;
-            const context = this.getOrCreateRemoteAudioContext();
-            while (this.pendingRemoteAudio.length > 0) {
-                const chunk = this.pendingRemoteAudio.shift();
-                if (!chunk)
-                    continue;
-                try {
-                    const decoded = yield this.decodeAudioChunk(context, chunk);
-                    this.assistantAudioStarted();
-                    yield this.playDecodedBuffer(context, decoded);
-                }
-                catch (_a) {
-                    // Ignore undecodable chunks; server may mix non-audio binary events.
-                }
-            }
-            this.remoteAudioPlaying = false;
-            this.assistantAudioStopped();
-        });
+    onBotReady() {
+        var _a, _b, _c;
+        // Retry track wiring in case tracks weren't ready at onConnected
+        this.startLocalMicAnalyzer();
+        const botTrack = (_c = (_b = (_a = this.pcClient) === null || _a === void 0 ? void 0 : _a.tracks()) === null || _b === void 0 ? void 0 : _b.bot) === null || _c === void 0 ? void 0 : _c.audio;
+        if (botTrack)
+            this.setupBotAudioTrack(botTrack);
     }
-    getOrCreateRemoteAudioContext() {
-        if (!this.remoteAudioContext || this.remoteAudioContext.state === 'closed') {
-            this.remoteAudioContext = new AudioContext();
-        }
-        if (this.remoteAudioContext.state === 'suspended') {
-            void this.remoteAudioContext.resume();
+    startLocalMicAnalyzer() {
+        var _a, _b, _c;
+        const localTrack = (_c = (_b = (_a = this.pcClient) === null || _a === void 0 ? void 0 : _a.tracks()) === null || _b === void 0 ? void 0 : _b.local) === null || _c === void 0 ? void 0 : _c.audio;
+        if (localTrack) {
+            this.audioAnalyzer.start(new MediaStream([localTrack]));
         }
-        return this.remoteAudioContext;
     }
-    decodeAudioChunk(context, chunk) {
-        return new Promise((resolve, reject) => {
-            context.decodeAudioData(chunk.slice(0), resolve, reject);
-        });
-    }
-    playDecodedBuffer(context, buffer) {
-        return new Promise((resolve) => {
-            const source = context.createBufferSource();
-            source.buffer = buffer;
-            source.connect(context.destination);
-            source.onended = () => resolve();
-            source.start();
-        });
-    }
-    assistantAudioStarted() {
+    onBotStartedSpeaking() {
         if (this.callStartTime === 0) {
             this.callStartTime = Date.now();
             this.startDurationTimer();
         }
         this.callStateSubject.next('talking');
     }
-    assistantAudioStopped() {
+    onBotStoppedSpeaking() {
         if (this.callStateSubject.value === 'talking') {
             this.callStateSubject.next('connected');
         }
     }
-    resetRemoteAudioPlayback() {
-        this.pendingRemoteAudio = [];
-        this.remoteAudioPlaying = false;
-        if (this.remoteAudioContext && this.remoteAudioContext.state !== 'closed') {
-            this.remoteAudioContext.close().catch(() => { });
+    setupBotAudioTrack(track) {
+        var _a;
+        if (!this.botAudioElement) {
+            this.botAudioElement = new Audio();
+            this.botAudioElement.autoplay = true;
         }
-        this.remoteAudioContext = null;
+        const existing = (_a = this.botAudioElement.srcObject) === null || _a === void 0 ? void 0 : _a.getAudioTracks()[0];
+        if ((existing === null || existing === void 0 ? void 0 : existing.id) === track.id)
+            return;
+        this.botAudioElement.srcObject = new MediaStream([track]);
+        this.botAudioElement.play().catch((err) => console.warn('[HiveGpt Voice] Bot audio play blocked', err));
     }
-    handleRemoteClose() {
-        return __awaiter(this, void 0, void 0, function* () {
-            const state = this.callStateSubject.value;
-            if (state === 'idle' || state === 'ended')
-                return;
-            this.endCall$.next();
-            this.stopDurationTimer();
-            this.callStartTime = 0;
-            this.audioAnalyzer.stop();
-            this.stopLocalMic();
-            this.resetRemoteAudioPlayback();
-            this.callStateSubject.next('ended');
-            this.statusTextSubject.next('Connection lost');
-        });
+    stopBotAudio() {
+        var _a;
+        if (this.botAudioElement) {
+            try {
+                this.botAudioElement.pause();
+                (_a = this.botAudioElement.srcObject) === null || _a === void 0 ? void 0 : _a.getAudioTracks().forEach((t) => t.stop());
+                this.botAudioElement.srcObject = null;
+            }
+            catch (_b) {
+                // ignore
+            }
+            this.botAudioElement = null;
+        }
     }
     disconnect() {
         return __awaiter(this, void 0, void 0, function* () {
-            this.endCall$.next();
             this.stopDurationTimer();
             this.callStartTime = 0;
             this.audioAnalyzer.stop();
-            this.stopLocalMic();
-            this.resetRemoteAudioPlayback();
-            this.wsClient.disconnect();
+            this.stopBotAudio();
+            yield this.cleanupPipecatClient();
             this.callStateSubject.next('ended');
             this.statusTextSubject.next('Call Ended');
         });
     }
+    cleanupPipecatClient() {
+        return __awaiter(this, void 0, void 0, function* () {
+            if (this.pcClient) {
+                try {
+                    yield this.pcClient.disconnect();
+                }
+                catch (_a) {
+                    // ignore
+                }
+                this.pcClient = null;
+            }
+        });
+    }
     toggleMic() {
-        var _a;
+        if (!this.pcClient)
+            return;
         const nextMuted = !this.isMicMutedSubject.value;
-        const track = (_a = this.localMicStream) === null || _a === void 0 ? void 0 : _a.getAudioTracks()[0];
-        if (track) {
-            track.enabled = !nextMuted;
-        }
+        this.pcClient.enableMic(!nextMuted);
         this.isMicMutedSubject.next(nextMuted);
+        if (nextMuted)
+            this.isUserSpeakingSubject.next(false);
     }
     startDurationTimer() {
-        const updateDuration = () => {
+        const tick = () => {
             if (this.callStartTime > 0) {
                 const elapsed = Math.floor((Date.now() - this.callStartTime) / 1000);
-                const minutes = Math.floor(elapsed / 60);
-                const seconds = elapsed % 60;
-                this.durationSubject.next(`${minutes}:${String(seconds).padStart(2, '0')}`);
+                const m = Math.floor(elapsed / 60);
+                const s = elapsed % 60;
+                this.durationSubject.next(`${m}:${String(s).padStart(2, '0')}`);
             }
         };
-        updateDuration();
-        this.durationInterval = setInterval(updateDuration, 1000);
+        tick();
+        this.durationInterval = setInterval(tick, 1000);
     }
     stopDurationTimer() {
         if (this.durationInterval) {
@@ -1347,7 +1077,7 @@ class VoiceAgentService {
         }
     }
 }
-VoiceAgentService.ɵprov = i0.ɵɵdefineInjectable({ factory: function VoiceAgentService_Factory() { return new VoiceAgentService(i0.ɵɵinject(AudioAnalyzerService), i0.ɵɵinject(WebSocketVoiceClientService), i0.ɵɵinject(PlatformTokenRefreshService), i0.ɵɵinject(i0.PLATFORM_ID)); }, token: VoiceAgentService, providedIn: "root" });
+VoiceAgentService.ɵprov = i0.ɵɵdefineInjectable({ factory: function VoiceAgentService_Factory() { return new VoiceAgentService(i0.ɵɵinject(AudioAnalyzerService), i0.ɵɵinject(PlatformTokenRefreshService), i0.ɵɵinject(i0.NgZone), i0.ɵɵinject(i0.PLATFORM_ID)); }, token: VoiceAgentService, providedIn: "root" });
 VoiceAgentService.decorators = [
     { type: Injectable, args: [{
                 providedIn: 'root',
@@ -1355,8 +1085,8 @@ VoiceAgentService.decorators = [
 ];
 VoiceAgentService.ctorParameters = () => [
     { type: AudioAnalyzerService },
-    { type: WebSocketVoiceClientService },
     { type: PlatformTokenRefreshService },
+    { type: NgZone },
     { type: Object, decorators: [{ type: Inject, args: [PLATFORM_ID,] }] }
 ];
@@ -5395,8 +5125,8 @@ ChatBotComponent.propDecorators = {
 };
 /**
- * Voice agent module. Uses native WebSocket for the voice session.
- * Does NOT use Socket.IO or ngx-socket-io.
+ * Voice agent module. Uses @pipecat-ai/client-js + @pipecat-ai/websocket-transport
+ * (peer dependencies) for WebSocket transport, RTVI protocol, and audio.
  */
 class VoiceAgentModule {
 }
@@ -5411,7 +5141,6 @@ VoiceAgentModule.decorators = [
                 providers: [
                     VoiceAgentService,
                     AudioAnalyzerService,
-                    WebSocketVoiceClientService
                 ],
                 exports: [
                     VoiceAgentModalComponent
@@ -5682,5 +5411,5 @@ HiveGptModule.decorators = [
  * Generated bundle index. Do not edit.
  */
-export { AudioAnalyzerService, ChatBotComponent, ChatDrawerComponent, HIVEGPT_AUTH_STORAGE_KEY, HiveGptModule, PlatformTokenRefreshService, VOICE_MODAL_CLOSE_CALLBACK, VOICE_MODAL_CONFIG, VoiceAgentModalComponent, VoiceAgentModule, VoiceAgentService, eClassificationType, hiveGptAuthStorageKeyFactory, BotsService as ɵa, SocketService as ɵb, ConversationService as ɵc, NotificationSocket as ɵd, TranslationService as ɵe, WebSocketVoiceClientService as ɵf, VideoPlayerComponent as ɵg, SafeHtmlPipe as ɵh, BotHtmlEditorComponent as ɵi };
+export { AudioAnalyzerService, ChatBotComponent, ChatDrawerComponent, HIVEGPT_AUTH_STORAGE_KEY, HiveGptModule, PlatformTokenRefreshService, VOICE_MODAL_CLOSE_CALLBACK, VOICE_MODAL_CONFIG, VoiceAgentModalComponent, VoiceAgentModule, VoiceAgentService, eClassificationType, hiveGptAuthStorageKeyFactory, BotsService as ɵa, SocketService as ɵb, ConversationService as ɵc, NotificationSocket as ɵd, TranslationService as ɵe, VideoPlayerComponent as ɵf, SafeHtmlPipe as ɵg, BotHtmlEditorComponent as ɵh };
 //# sourceMappingURL=hivegpt-hiveai-angular.js.map