npm - @memori.ai/memori-react - Versions diffs - 7.34.2 → 8.0.0-rc.1 - Mend

@memori.ai/memori-react 7.34.2 → 8.0.0-rc.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54) hide show

package/CHANGELOG.md +35 -0
package/dist/components/Chat/Chat.d.ts +1 -0
package/dist/components/Chat/Chat.js +2 -2
package/dist/components/Chat/Chat.js.map +1 -1
package/dist/components/ChatInputs/ChatInputs.d.ts +1 -0
package/dist/components/ChatInputs/ChatInputs.js +3 -3
package/dist/components/ChatInputs/ChatInputs.js.map +1 -1
package/dist/components/MemoriWidget/MemoriWidget.d.ts +3 -3
package/dist/components/MemoriWidget/MemoriWidget.js +138 -425
package/dist/components/MemoriWidget/MemoriWidget.js.map +1 -1
package/dist/context/visemeContext.js +39 -30
package/dist/context/visemeContext.js.map +1 -1
package/dist/helpers/sanitizer.d.ts +6 -0
package/dist/helpers/sanitizer.js +41 -0
package/dist/helpers/sanitizer.js.map +1 -0
package/dist/helpers/tts/ttsVoiceUtility.d.ts +158 -0
package/dist/helpers/tts/ttsVoiceUtility.js +192 -0
package/dist/helpers/tts/ttsVoiceUtility.js.map +1 -0
package/dist/helpers/tts/useTTS.d.ts +26 -0
package/dist/helpers/tts/useTTS.js +274 -0
package/dist/helpers/tts/useTTS.js.map +1 -0
package/dist/index.js +12 -7
package/dist/index.js.map +1 -1
package/esm/components/Chat/Chat.d.ts +1 -0
package/esm/components/Chat/Chat.js +2 -2
package/esm/components/Chat/Chat.js.map +1 -1
package/esm/components/ChatInputs/ChatInputs.d.ts +1 -0
package/esm/components/ChatInputs/ChatInputs.js +3 -3
package/esm/components/ChatInputs/ChatInputs.js.map +1 -1
package/esm/components/MemoriWidget/MemoriWidget.d.ts +3 -3
package/esm/components/MemoriWidget/MemoriWidget.js +139 -426
package/esm/components/MemoriWidget/MemoriWidget.js.map +1 -1
package/esm/context/visemeContext.js +39 -30
package/esm/context/visemeContext.js.map +1 -1
package/esm/helpers/sanitizer.d.ts +6 -0
package/esm/helpers/sanitizer.js +32 -0
package/esm/helpers/sanitizer.js.map +1 -0
package/esm/helpers/tts/ttsVoiceUtility.d.ts +158 -0
package/esm/helpers/tts/ttsVoiceUtility.js +182 -0
package/esm/helpers/tts/ttsVoiceUtility.js.map +1 -0
package/esm/helpers/tts/useTTS.d.ts +26 -0
package/esm/helpers/tts/useTTS.js +270 -0
package/esm/helpers/tts/useTTS.js.map +1 -0
package/esm/index.js +12 -7
package/esm/index.js.map +1 -1
package/package.json +2 -2
package/src/components/Chat/Chat.tsx +3 -0
package/src/components/ChatInputs/ChatInputs.tsx +4 -2
package/src/components/MemoriWidget/MemoriWidget.tsx +246 -637
package/src/context/visemeContext.tsx +77 -55
package/src/helpers/sanitizer.ts +71 -0
package/src/helpers/tts/ttsVoiceUtility.ts +275 -0
package/src/helpers/tts/useTTS.ts +431 -0
package/src/index.tsx +14 -10

package/src/helpers/tts/useTTS.ts ADDED Viewed

@@ -0,0 +1,431 @@
+// Improved useTTS.ts with better viseme handling
+import { useState, useCallback, useEffect, useRef } from 'react';
+import { sanitizeText } from '../sanitizer';
+import { getLocalConfig } from '../configuration';
+import Alert from '../../components/ui/Alert';
+import { useViseme } from '../../context/visemeContext';
+import { IAudioContext } from 'standardized-audio-context';
+/**
+ * Configuration for the TTS request.
+ *
+ * useTTS forwards these fields in the JSON body of the synthesis request
+ * (`provider`, `voice`, `model`, `region`, `tenant`).
+ */
+export interface TTSConfig {
+  provider: 'azure' | 'openai';
+  voice?: string;
+  model?: string; // useTTS sends 'tts-1' when this is omitted
+  region?: string; // required for Azure
+  tenant?: string; // Tenant identifier for multi-tenant applications; useTTS sends 'www.aisuru.com' when omitted
+}
+type VisemeData = { // one viseme event, as parsed by useTTS from the `X-Viseme-Data` response header
+  visemeId: number; // passed as the first argument to addViseme
+  audioOffset: number; // passed as the second argument to addViseme; unit is not visible here — TODO confirm
+};
+/**
+ * Options for the useTTS hook.
+ */
+export interface UseTTSOptions {
+  apiUrl?: string; // useTTS falls back to '/api/tts' when this is unset
+  continuousSpeech?: boolean; // when truthy (and onEndSpeakStartListen is set), listening is started after the end-of-speech event
+  onEndSpeakStartListen?: () => void; // invoked after the 'MemoriEndSpeak' event when continuousSpeech is enabled
+  preview?: boolean; // when truthy, speak() skips synthesis and only emits the end-of-speech event
+  disableSpeaker?: boolean; // NOTE(review): not read by useTTS in this file — confirm where it is consumed
+}
+// Simplified, audio-context-like interface (currentTime / state / onstatechange) that useTTS builds around its HTMLAudioElement for better typing
+interface SimpleAudioWrapper {
+  currentTime: number; // read from the wrapped audio element (0 when there is no element)
+  state: 'running' | 'suspended' | 'closed'; // updated from the element's play / pause / ended events
+  onstatechange: ((this: AudioContext, ev: Event) => any) | null; // called with a 'statechange' Event each time state is updated
+}
+/**
+ * Unified hook that handles speech synthesis and playback.
+ *
+ * `speak(text)` sanitizes the text, POSTs it as JSON to the TTS endpoint
+ * (`options.apiUrl`, defaulting to '/api/tts'), plays the returned audio blob
+ * through an `HTMLAudioElement`, and, when the response carries an
+ * `X-Viseme-Data` header, loads those events into the viseme context and starts
+ * viseme processing against a small wrapper around the audio element.
+ *
+ * Side effects visible to the rest of the page:
+ * - dispatches a `MemoriEndSpeak` CustomEvent on `document` when speech ends,
+ *   is skipped, or fails;
+ * - mirrors `isPlaying` into `window.memoriSpeaking`;
+ * - installs `speak` as `window.speak` while mounted and restores the previous
+ *   value on unmount.
+ *
+ * @param config TTS provider settings forwarded in the request body.
+ * @param options Hook options (endpoint URL, preview mode, continuous speech).
+ * @param autoStart Used only to compute the default mute state.
+ * @param defaultEnableAudio Used only to compute the default mute state.
+ * @param defaultSpeakerActive Used only to compute the default mute state.
+ * @returns Playback controls (`speak`, `stop`, `toggleMute`) and state
+ *   (`isPlaying`, `speakerMuted`, `hasUserActivatedSpeak`, `error`) plus the
+ *   `setHasUserActivatedSpeak` / `setError` setters.
+ */
+export function useTTS(
+  config: TTSConfig,
+  options: UseTTSOptions = {},
+  autoStart: boolean = false,
+  defaultEnableAudio: boolean = true,
+  defaultSpeakerActive: boolean = true
+) {
+  // Audio wrapper plus the listener-removal callback attached by createAudioWrapper
+  type ManagedAudioWrapper = SimpleAudioWrapper & { cleanup?: () => void };
+
+  // Local state
+  const [isPlaying, setIsPlaying] = useState(false);
+  // Second argument is the default mute state: muted when audio is disabled,
+  // the speaker is inactive by default, or the widget auto-starts.
+  // NOTE(review): presumably getLocalConfig returns a persisted value when one exists — confirm.
+  const [speakerMuted, setSpeakerMuted] = useState(
+    getLocalConfig(
+      'muteSpeaker',
+      !defaultEnableAudio || !defaultSpeakerActive || autoStart
+    )
+  );
+  // Viseme queue controls from the viseme context
+  const {
+    addViseme,
+    resetVisemeQueue,
+    startProcessing,
+    stopProcessing,
+  } = useViseme();
+  const [hasUserActivatedSpeak, setHasUserActivatedSpeak] = useState(false);
+  const [error, setError] = useState<Error | null>(null);
+  // Refs
+  const audioRef = useRef<HTMLAudioElement | null>(null);
+  const audioWrapperRef = useRef<ManagedAudioWrapper | null>(null);
+  // Whatever was on window.speak before this hook installed its own function
+  const globalSpeakRef = useRef<unknown>(null);
+  const visemeLoadedRef = useRef<boolean>(false);
+  // Re-entrancy guard: true from the start of a speak() session until it ends
+  const isSpeakingRef = useRef<boolean>(false);
+  const apiUrl = options.apiUrl || '/api/tts';
+  /**
+   * Replaces the viseme queue with the given events.
+   * Returns true when at least one event was queued, false otherwise.
+   */
+  const loadVisemeData = useCallback(
+    (visemeData: VisemeData[]) => {
+      // Make sure we're in a clean state before loading new visemes
+      resetVisemeQueue();
+      visemeLoadedRef.current = false;
+      if (visemeData && visemeData.length > 0) {
+        console.log(`[useTTS] Loading ${visemeData.length} viseme events`);
+        visemeData.forEach(viseme => {
+          addViseme(viseme.visemeId, viseme.audioOffset);
+        });
+        visemeLoadedRef.current = true;
+        return true;
+      } else {
+        console.warn('[useTTS] No viseme data available');
+        return false;
+      }
+    },
+    [addViseme, resetVisemeQueue]
+  );
+  /**
+   * Builds the audio-context-like wrapper handed to the viseme processor.
+   * Its state follows the current audio element's play / pause / ended events.
+   * Returns null when there is no audio element yet.
+   */
+  const createAudioWrapper = useCallback((): ManagedAudioWrapper | null => {
+    // Capture the element so listeners are removed from the same element they
+    // were added to, even if audioRef is reassigned later.
+    const audio = audioRef.current;
+    if (!audio) {
+      console.warn('[useTTS] Cannot create audio wrapper: audio element is null');
+      return null;
+    }
+    // Create a clean wrapper for this audio session
+    const wrapper: ManagedAudioWrapper = {
+      state: 'running',
+      onstatechange: null,
+      get currentTime() {
+        return audioRef.current ? audioRef.current.currentTime : 0;
+      },
+    };
+    // Update the state and notify the subscriber, if any
+    const transitionTo = (next: SimpleAudioWrapper['state']) => {
+      wrapper.state = next;
+      if (wrapper.onstatechange) {
+        wrapper.onstatechange.call(null as any, new Event('statechange'));
+      }
+    };
+    const handlePause = () => transitionTo('suspended');
+    const handlePlay = () => transitionTo('running');
+    const handleEnded = () => transitionTo('closed');
+    // Attach event listeners to the audio element
+    audio.addEventListener('pause', handlePause);
+    audio.addEventListener('play', handlePlay);
+    audio.addEventListener('ended', handleEnded);
+    // Store the listener-removal function on the wrapper for later use
+    wrapper.cleanup = () => {
+      audio.removeEventListener('pause', handlePause);
+      audio.removeEventListener('play', handlePlay);
+      audio.removeEventListener('ended', handleEnded);
+    };
+    console.log('[useTTS] Created audio wrapper for viseme processing');
+    return wrapper;
+  }, []);
+  /**
+   * Performs a complete cleanup of audio and viseme resources.
+   * Also clears the speaking guard, so it ends the current speak() session.
+   */
+  const cleanup = useCallback(() => {
+    console.log('[useTTS] Cleaning up audio and viseme resources');
+    // First, clean up audio wrapper
+    const wrapper = audioWrapperRef.current;
+    if (wrapper?.cleanup) {
+      wrapper.cleanup();
+      console.log('[useTTS] Cleaned up audio wrapper event listeners');
+    }
+    audioWrapperRef.current = null;
+    // Then stop viseme processing
+    stopProcessing();
+    console.log('[useTTS] Stopped viseme processing');
+    // Finally clean up audio resources
+    const audio = audioRef.current;
+    if (audio) {
+      if (audio.src) {
+        URL.revokeObjectURL(audio.src);
+        console.log('[useTTS] Revoked audio object URL');
+      }
+      // Always drop the element so its late events are recognised as stale
+      audioRef.current = null;
+    }
+    // Reset flags
+    visemeLoadedRef.current = false;
+    isSpeakingRef.current = false;
+  }, [stopProcessing]);
+  /**
+   * Stops audio playback and cleans up
+   */
+  const stop = useCallback((): void => {
+    console.log('[useTTS] Stopping audio playback');
+    // Pause audio first
+    if (audioRef.current) {
+      audioRef.current.pause();
+      audioRef.current.currentTime = 0;
+    }
+    // Set UI state
+    setIsPlaying(false);
+    // Clean up all resources
+    cleanup();
+  }, [cleanup]);
+  /**
+   * Emits the end-of-speech event
+   */
+  const emitEndSpeakEvent = useCallback(() => {
+    console.log('[useTTS] Emitting end speak event');
+    const e = new CustomEvent('MemoriEndSpeak');
+    document.dispatchEvent(e);
+    // When continuous speech is enabled, start listening again
+    if (options.continuousSpeech && options.onEndSpeakStartListen) {
+      console.log('[useTTS] Starting continuous speech listening');
+      options.onEndSpeakStartListen();
+    }
+  }, [options.continuousSpeech, options.onEndSpeakStartListen]);
+  /**
+   * Synthesizes the text to audio and plays it.
+   *
+   * Does nothing while another speak() session is active. When the text is
+   * empty, the hook is in preview mode, or the speaker is muted, only the
+   * end-of-speech event is emitted. On request failure it records the error,
+   * tries the browser's speechSynthesis as a fallback, and emits the
+   * end-of-speech event.
+   */
+  const speak = useCallback(
+    async (text: string): Promise<void> => {
+      if (isSpeakingRef.current) {
+        return;
+      }
+      if (!text || options.preview || speakerMuted) {
+        emitEndSpeakEvent();
+        return;
+      }
+      if (!hasUserActivatedSpeak) {
+        setHasUserActivatedSpeak(true);
+      }
+      try {
+        stop();
+        // stop() -> cleanup() clears the guard, so raise it only afterwards;
+        // otherwise a second speak() could start while this one is in flight.
+        isSpeakingRef.current = true;
+        setIsPlaying(true);
+        setError(null);
+        const processedText = sanitizeText(text);
+        // Use the configured endpoint rather than a hard-coded development URL
+        const response = await fetch(apiUrl, {
+          method: 'POST',
+          headers: {
+            'Content-Type': 'application/json',
+          },
+          body: JSON.stringify({
+            text: processedText,
+            tenant: config.tenant || 'www.aisuru.com',
+            voice: config.voice,
+            model: config.model || 'tts-1',
+            region: config.region,
+            provider: config.provider,
+            includeVisemes: true,
+          }),
+        });
+        if (!response.ok) {
+          const errorData = await response.json().catch(() => ({}));
+          throw new Error(errorData.error || `API error: ${response.status}`);
+        }
+        const visemeDataHeader = response.headers.get('X-Viseme-Data');
+        let hasVisemeData = false;
+        if (visemeDataHeader) {
+          try {
+            const parsed: unknown = JSON.parse(visemeDataHeader);
+            if (Array.isArray(parsed)) {
+              hasVisemeData = loadVisemeData(parsed as VisemeData[]);
+            } else {
+              console.warn('[useTTS] Viseme data is not an array, ignoring it');
+            }
+          } catch (err) {
+            console.error('[useTTS] Error parsing viseme data:', err);
+          }
+        }
+        const audioBlob = await response.blob();
+        const audioUrl = URL.createObjectURL(audioBlob);
+        // Handlers close over this element; events from an element that is no
+        // longer the current one (after stop()/cleanup()) are ignored.
+        const audio = new Audio(audioUrl);
+        audioRef.current = audio;
+        if (hasVisemeData) {
+          audioWrapperRef.current = createAudioWrapper();
+        }
+        audio.oncanplaythrough = async () => {
+          if (audioRef.current !== audio) {
+            return;
+          }
+          // One-shot: canplaythrough may fire again on the same element
+          audio.oncanplaythrough = null;
+          try {
+            if (hasVisemeData && audioWrapperRef.current) {
+              startProcessing(audioWrapperRef.current as unknown as IAudioContext);
+            }
+            await audio.play();
+          } catch (e) {
+            // play() rejects e.g. when the browser blocks playback
+            console.error('[useTTS] Audio playback could not start:', e);
+            setIsPlaying(false);
+            cleanup();
+            emitEndSpeakEvent();
+          }
+        };
+        audio.onended = () => {
+          if (audioRef.current !== audio) {
+            return;
+          }
+          setIsPlaying(false);
+          isSpeakingRef.current = false;
+          cleanup();
+          emitEndSpeakEvent();
+        };
+        audio.onerror = () => {
+          if (audioRef.current !== audio) {
+            return;
+          }
+          setIsPlaying(false);
+          isSpeakingRef.current = false;
+          cleanup();
+          const errorMsg = new Error(`Audio playback failed. This may be due to a network issue or audio format problem.`);
+          setError(errorMsg);
+          emitEndSpeakEvent();
+        };
+        audio.load();
+      } catch (err) {
+        setIsPlaying(false);
+        isSpeakingRef.current = false;
+        cleanup();
+        const errorMsg = err instanceof Error ? err : new Error(String(err));
+        setError(errorMsg);
+        // Best-effort fallback to the browser's built-in synthesis
+        try {
+          if ('speechSynthesis' in window) {
+            const utterance = new SpeechSynthesisUtterance(sanitizeText(text));
+            window.speechSynthesis.speak(utterance);
+          }
+        } catch (fallbackErr) {
+          console.error('[useTTS] Browser fallback synthesis error:', fallbackErr);
+        }
+        emitEndSpeakEvent();
+      }
+    },
+    [
+      apiUrl,
+      config,
+      speakerMuted,
+      options.preview,
+      hasUserActivatedSpeak,
+      stop,
+      cleanup,
+      loadVisemeData,
+      createAudioWrapper,
+      startProcessing,
+      emitEndSpeakEvent,
+    ]
+  );
+  /**
+   * Sets the mute state; toggles it when no explicit value is given
+   */
+  const toggleMute = useCallback(
+    (mute?: boolean) => {
+      const newMuteState = mute !== undefined ? mute : !speakerMuted;
+      console.log('[useTTS] Toggling mute state to:', newMuteState);
+      setSpeakerMuted(newMuteState);
+      // If we are muting while audio is playing, stop the audio
+      if (newMuteState && isPlaying) {
+        stop();
+      }
+    },
+    [speakerMuted, isPlaying, stop]
+  );
+  /**
+   * Updates the global variable whenever isPlaying changes
+   */
+  useEffect(() => {
+    console.log('[useTTS] Updating global memoriSpeaking state:', isPlaying);
+    if (typeof window !== 'undefined') {
+      (window as any).memoriSpeaking = isPlaying;
+    }
+  }, [isPlaying]);
+  /**
+   * Exposes the speak function globally
+   */
+  useEffect(() => {
+    if (typeof window !== 'undefined') {
+      console.log('[useTTS] Setting up global speak function');
+      // Keep a reference to the original function, if any
+      globalSpeakRef.current = (window as any).speak;
+      // Install our function
+      (window as any).speak = speak;
+      // Cleanup on unmount
+      return () => {
+        console.log('[useTTS] Cleaning up global speak function');
+        // Restore the original function if there was one
+        (window as any).speak = globalSpeakRef.current;
+      };
+    }
+  }, [speak]);
+  /**
+   * Releases resources on unmount
+   */
+  useEffect(() => {
+    return () => {
+      console.log('[useTTS] Component unmounting, cleaning up');
+      stop();
+    };
+  }, [stop]);
+  return {
+    speak,
+    stop,
+    isPlaying,
+    speakerMuted,
+    toggleMute,
+    hasUserActivatedSpeak,
+    setHasUserActivatedSpeak,
+    error,
+    setError,
+  };
+}

package/src/index.tsx CHANGED Viewed

@@ -150,7 +150,7 @@ const Memori: React.FC<Props> = ({
 }) => {
   const [memori, setMemori] = useState<IMemori>();
   const [tenant, setTenant] = useState<Tenant>();
-  const [speechKey, setSpeechKey] = useState<string | undefined>();
+  const [provider, setProvider] = useState<string | undefined>();
   const { t } = useTranslation();
   if (!((memoriID && ownerUserID) || (memoriName && ownerUserName))) {
@@ -162,17 +162,21 @@ const Memori: React.FC<Props> = ({
   const client = memoriApiClient(apiURL, engineURL);
   const fetchSpeechKey = useCallback(async () => {
-    const url =
-      baseURL ||
-      (tenantID.startsWith('https://') ? tenantID : `https://${tenantID}`);
+    const url =  baseURL ||
+       (tenantID.startsWith('https://') ? tenantID : `https://${tenantID}`);
     try {
-      const result = await fetch(`${url}/api/speechkey`);
+      const result = await fetch(`${url}/api/speechkey?tenant=${tenantID}`, {
+        method: 'GET',
+        headers: {
+          'Content-Type': 'application/json',
+        },
+      });
       const data = await result.json();
-      if (data.AZURE_COGNITIVE_SERVICES_TTS_KEY) {
-        setSpeechKey(data.AZURE_COGNITIVE_SERVICES_TTS_KEY);
+      if (data.provider) {
+        setProvider(data.provider);
       } else {
-        console.log('AZURE_COGNITIVE_SERVICES_TTS_KEY not found');
+        console.log('provider not found');
       }
     } catch (error) {
       console.error('Error fetching speech key', error);
@@ -328,7 +332,7 @@ const Memori: React.FC<Props> = ({
             initialContextVars={initialContextVars}
             initialQuestion={initialQuestionLayout}
             authToken={authToken}
-            AZURE_COGNITIVE_SERVICES_TTS_KEY={speechKey}
+            ttsProvider={provider ? provider as 'azure' | 'openai' : 'azure'}
             autoStart={
               autoStart !== undefined
                 ? autoStart
@@ -336,7 +340,7 @@ const Memori: React.FC<Props> = ({
                   ? true
                   : autoStart
             }
-            enableAudio={enableAudio && !!speechKey}
+            enableAudio={enableAudio && !!provider}
             defaultSpeakerActive={defaultSpeakerActive}
             disableTextEnteredEvents={disableTextEnteredEvents}
             onStateChange={onStateChange}