npm - @copilotz/chat-ui - Version diff - 0.1.33 → 0.1.34 - Mend

@copilotz/chat-ui 0.1.33 → 0.1.34

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (5)

package/dist/index.cjs CHANGED

@@ -101,7 +101,7 @@ var defaultChatConfig = {
     voiceSendNow: "Send now",
     voiceCancel: "Cancel",
     voiceDiscard: "Delete recording",
-    voiceRecordAgain: "Record again",
+    voiceRecordAgain: "Continue recording",
     voiceAutoSendIn: "Auto-sends in {{seconds}}s",
     voiceTranscriptPending: "Transcript unavailable",
     voicePermissionDenied: "Microphone access was denied.",
@@ -2866,6 +2866,121 @@ var blobToDataUrl = (blob) => new Promise((resolve, reject) => {
   reader.onerror = () => reject(reader.error ?? new Error("Failed to read recorded audio"));
   reader.readAsDataURL(blob);
 });
+var joinTranscriptParts = (...parts) => {
+  const value = parts.map((part) => part?.trim()).filter((part) => Boolean(part && part.length > 0)).join(" ").trim();
+  return value.length > 0 ? value : void 0;
+};
+var getAudioContextCtor = () => globalThis.AudioContext || globalThis.webkitAudioContext;
+var getOfflineAudioContextCtor = () => globalThis.OfflineAudioContext || globalThis.webkitOfflineAudioContext;
+var attachmentToArrayBuffer = async (attachment) => {
+  const response = await fetch(attachment.dataUrl);
+  return response.arrayBuffer();
+};
+var decodeAudioAttachment = async (attachment) => {
+  const AudioContextCtor = getAudioContextCtor();
+  if (!AudioContextCtor) {
+    throw new Error("Audio decoding is not supported in this browser");
+  }
+  const audioContext = new AudioContextCtor();
+  try {
+    const arrayBuffer = await attachmentToArrayBuffer(attachment);
+    return await audioContext.decodeAudioData(arrayBuffer.slice(0));
+  } finally {
+    await closeAudioContext(audioContext);
+  }
+};
+var renderMergedBuffer = async (buffers) => {
+  const OfflineAudioContextCtor = getOfflineAudioContextCtor();
+  if (!OfflineAudioContextCtor) {
+    throw new Error("Offline audio rendering is not supported in this browser");
+  }
+  const numberOfChannels = Math.max(...buffers.map((buffer) => buffer.numberOfChannels));
+  const sampleRate = Math.max(...buffers.map((buffer) => buffer.sampleRate));
+  const totalFrames = Math.max(1, Math.ceil(buffers.reduce((sum, buffer) => sum + buffer.duration * sampleRate, 0)));
+  const offlineContext = new OfflineAudioContextCtor(numberOfChannels, totalFrames, sampleRate);
+  let offsetSeconds = 0;
+  for (const buffer of buffers) {
+    const source = offlineContext.createBufferSource();
+    source.buffer = buffer;
+    source.connect(offlineContext.destination);
+    source.start(offsetSeconds);
+    offsetSeconds += buffer.duration;
+  }
+  return offlineContext.startRendering();
+};
+var encodeWav = (audioBuffer) => {
+  const numberOfChannels = audioBuffer.numberOfChannels;
+  const sampleRate = audioBuffer.sampleRate;
+  const bitsPerSample = 16;
+  const bytesPerSample = bitsPerSample / 8;
+  const dataLength = audioBuffer.length * numberOfChannels * bytesPerSample;
+  const buffer = new ArrayBuffer(44 + dataLength);
+  const view = new DataView(buffer);
+  const writeString = (offset2, value) => {
+    for (let index = 0; index < value.length; index += 1) {
+      view.setUint8(offset2 + index, value.charCodeAt(index));
+    }
+  };
+  writeString(0, "RIFF");
+  view.setUint32(4, 36 + dataLength, true);
+  writeString(8, "WAVE");
+  writeString(12, "fmt ");
+  view.setUint32(16, 16, true);
+  view.setUint16(20, 1, true);
+  view.setUint16(22, numberOfChannels, true);
+  view.setUint32(24, sampleRate, true);
+  view.setUint32(28, sampleRate * numberOfChannels * bytesPerSample, true);
+  view.setUint16(32, numberOfChannels * bytesPerSample, true);
+  view.setUint16(34, bitsPerSample, true);
+  writeString(36, "data");
+  view.setUint32(40, dataLength, true);
+  let offset = 44;
+  const channelData = Array.from({ length: numberOfChannels }, (_, index) => audioBuffer.getChannelData(index));
+  for (let sampleIndex = 0; sampleIndex < audioBuffer.length; sampleIndex += 1) {
+    for (let channelIndex = 0; channelIndex < numberOfChannels; channelIndex += 1) {
+      const sample = Math.max(-1, Math.min(1, channelData[channelIndex][sampleIndex]));
+      const pcmValue = sample < 0 ? sample * 32768 : sample * 32767;
+      view.setInt16(offset, pcmValue, true);
+      offset += 2;
+    }
+  }
+  return new Blob([buffer], { type: "audio/wav" });
+};
+var resolveSegmentCount = (segment) => {
+  const candidate = segment?.metadata?.segmentCount;
+  return typeof candidate === "number" && Number.isFinite(candidate) && candidate > 0 ? candidate : segment ? 1 : 0;
+};
+var mergeVoiceTranscripts = (previous, incoming) => ({
+  final: joinTranscriptParts(previous?.final, incoming?.final),
+  partial: joinTranscriptParts(previous?.final, incoming?.partial)
+});
+var appendVoiceSegments = async (previous, incoming) => {
+  const [previousBuffer, incomingBuffer] = await Promise.all([
+    decodeAudioAttachment(previous.attachment),
+    decodeAudioAttachment(incoming.attachment)
+  ]);
+  const mergedBuffer = await renderMergedBuffer([previousBuffer, incomingBuffer]);
+  const mergedBlob = encodeWav(mergedBuffer);
+  const dataUrl = await blobToDataUrl(mergedBlob);
+  const segmentCount = resolveSegmentCount(previous) + resolveSegmentCount(incoming);
+  return {
+    attachment: {
+      kind: "audio",
+      dataUrl,
+      mimeType: mergedBlob.type,
+      durationMs: Math.round(mergedBuffer.duration * 1e3),
+      fileName: `voice-${(/* @__PURE__ */ new Date()).toISOString().replace(/[:.]/g, "-")}.wav`,
+      size: mergedBlob.size
+    },
+    transcript: mergeVoiceTranscripts(previous.transcript, incoming.transcript),
+    metadata: {
+      ...previous.metadata,
+      ...incoming.metadata,
+      segmentCount,
+      source: segmentCount > 1 ? "merged" : incoming.metadata?.source ?? previous.metadata?.source
+    }
+  };
+};
 var stopStream = (stream) => {
   if (!stream) return;
   stream.getTracks().forEach((track) => track.stop());
@@ -2987,7 +3102,7 @@ var createManualVoiceProvider = async (handlers, options = {}) => {
                 fileName: `voice-${(/* @__PURE__ */ new Date()).toISOString().replace(/[:.]/g, "-")}.webm`,
                 size: blob.size
               },
-              metadata: { source: "manual" }
+              metadata: { source: "manual", segmentCount: 1 }
             });
           } else {
             handlers.onStateChange?.("idle");
@@ -3254,7 +3369,7 @@ var VoiceComposer = ({
         ] })
       ] })
     ] }),
-    state === "error" && errorMessage && /* @__PURE__ */ (0, import_jsx_runtime21.jsx)("div", { className: "mt-3 rounded-lg border border-destructive/30 bg-destructive/5 px-3 py-2 text-sm text-destructive", children: errorMessage })
+    errorMessage && /* @__PURE__ */ (0, import_jsx_runtime21.jsx)("div", { className: "mt-3 rounded-lg border border-destructive/30 bg-destructive/5 px-3 py-2 text-sm text-destructive", children: errorMessage })
   ] });
 };
@@ -3503,6 +3618,7 @@ var resolveVoiceErrorMessage = (error, config) => {
   return config?.labels?.voiceCaptureError || "Unable to capture audio.";
 };
 var clearVoiceTranscript = () => ({});
+var resolveVoiceSegmentDuration = (segment) => segment.attachment.durationMs ?? 0;
 var ChatInput = (0, import_react5.memo)(function ChatInput2({
   value,
   onChange,
@@ -3551,6 +3667,9 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
   const recordingInterval = (0, import_react5.useRef)(null);
   const mediaStreamRef = (0, import_react5.useRef)(null);
   const voiceProviderRef = (0, import_react5.useRef)(null);
+  const voiceDraftRef = (0, import_react5.useRef)(null);
+  const voiceAppendBaseRef = (0, import_react5.useRef)(null);
+  const voiceAppendBaseDurationRef = (0, import_react5.useRef)(0);
   (0, import_react5.useEffect)(() => {
     return () => {
       if (mediaStreamRef.current) {
@@ -3565,6 +3684,9 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
       }
     };
   }, []);
+  (0, import_react5.useEffect)(() => {
+    voiceDraftRef.current = voiceDraft;
+  }, [voiceDraft]);
   const handleSubmit = (e) => {
     e.preventDefault();
     if (!value.trim() && attachments.length === 0 || disabled || isGenerating) return;
@@ -3742,6 +3864,9 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
   const resetVoiceComposerState = (0, import_react5.useCallback)((nextState = "idle") => {
     setVoiceState(nextState);
     setVoiceDraft(null);
+    voiceDraftRef.current = null;
+    voiceAppendBaseRef.current = null;
+    voiceAppendBaseDurationRef.current = 0;
     setVoiceTranscript(clearVoiceTranscript());
     setVoiceDurationMs(0);
     setVoiceAudioLevel(0);
@@ -3757,23 +3882,76 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
     const provider = await createProvider({
       onStateChange: setVoiceState,
       onAudioLevelChange: setVoiceAudioLevel,
-      onDurationChange: setVoiceDurationMs,
-      onTranscriptChange: setVoiceTranscript,
+      onDurationChange: (durationMs) => {
+        setVoiceDurationMs(voiceAppendBaseDurationRef.current + durationMs);
+      },
+      onTranscriptChange: (transcript) => {
+        const baseTranscript = voiceAppendBaseRef.current?.transcript;
+        setVoiceTranscript(
+          baseTranscript ? mergeVoiceTranscripts(baseTranscript, transcript) : transcript
+        );
+      },
       onSegmentReady: (segment) => {
-        setVoiceDraft(segment);
-        setVoiceTranscript(segment.transcript ?? clearVoiceTranscript());
-        setVoiceDurationMs(segment.attachment.durationMs ?? 0);
-        setVoiceAudioLevel(0);
-        setVoiceCountdownMs(voiceAutoSendDelayMs);
-        setIsVoiceAutoSendActive(voiceAutoSendDelayMs > 0);
-        setVoiceError(null);
-        setVoiceState("review");
+        void (async () => {
+          const previousSegment = voiceAppendBaseRef.current;
+          try {
+            const nextSegment = previousSegment ? await appendVoiceSegments(previousSegment, segment) : segment;
+            voiceAppendBaseRef.current = null;
+            voiceAppendBaseDurationRef.current = 0;
+            voiceDraftRef.current = nextSegment;
+            setVoiceDraft(nextSegment);
+            setVoiceTranscript(nextSegment.transcript ?? clearVoiceTranscript());
+            setVoiceDurationMs(resolveVoiceSegmentDuration(nextSegment));
+            setVoiceAudioLevel(0);
+            setVoiceCountdownMs(voiceAutoSendDelayMs);
+            setIsVoiceAutoSendActive(voiceAutoSendDelayMs > 0);
+            setVoiceError(null);
+            setVoiceState("review");
+          } catch (error) {
+            const resolvedError = resolveVoiceErrorMessage(error, config);
+            voiceAppendBaseRef.current = null;
+            voiceAppendBaseDurationRef.current = 0;
+            setVoiceAudioLevel(0);
+            setVoiceCountdownMs(0);
+            setIsVoiceAutoSendActive(false);
+            if (previousSegment) {
+              voiceDraftRef.current = previousSegment;
+              setVoiceDraft(previousSegment);
+              setVoiceTranscript(previousSegment.transcript ?? clearVoiceTranscript());
+              setVoiceDurationMs(resolveVoiceSegmentDuration(previousSegment));
+              setVoiceError(resolvedError);
+              setVoiceState("review");
+              return;
+            }
+            voiceDraftRef.current = null;
+            setVoiceDraft(null);
+            setVoiceTranscript(clearVoiceTranscript());
+            setVoiceDurationMs(0);
+            setVoiceError(resolvedError);
+            setVoiceState("error");
+          }
+        })();
       },
       onError: (error) => {
+        const previousSegment = voiceAppendBaseRef.current;
+        voiceAppendBaseRef.current = null;
+        voiceAppendBaseDurationRef.current = 0;
         setVoiceError(resolveVoiceErrorMessage(error, config));
         setVoiceAudioLevel(0);
         setVoiceCountdownMs(0);
         setIsVoiceAutoSendActive(false);
+        if (previousSegment) {
+          voiceDraftRef.current = previousSegment;
+          setVoiceDraft(previousSegment);
+          setVoiceTranscript(previousSegment.transcript ?? clearVoiceTranscript());
+          setVoiceDurationMs(resolveVoiceSegmentDuration(previousSegment));
+          setVoiceState("review");
+          return;
+        }
+        voiceDraftRef.current = null;
+        setVoiceDraft(null);
+        setVoiceTranscript(clearVoiceTranscript());
+        setVoiceDurationMs(0);
         setVoiceState("error");
       }
     }, {
@@ -3783,35 +3961,67 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
     return provider;
   }, [config, voiceAutoSendDelayMs, voiceMaxRecordingMs]);
   const closeVoiceComposer = (0, import_react5.useCallback)(async () => {
+    voiceAppendBaseRef.current = null;
+    voiceAppendBaseDurationRef.current = 0;
     setIsVoiceComposerOpen(false);
     setVoiceError(null);
     setVoiceCountdownMs(0);
     setVoiceAudioLevel(0);
     setVoiceTranscript(clearVoiceTranscript());
     setVoiceDraft(null);
+    voiceDraftRef.current = null;
     setVoiceDurationMs(0);
     setVoiceState("idle");
     if (voiceProviderRef.current) {
       await voiceProviderRef.current.cancel();
     }
   }, []);
-  const startVoiceCapture = (0, import_react5.useCallback)(async () => {
+  const startVoiceCapture = (0, import_react5.useCallback)(async (appendToDraft = false) => {
     if (disabled || isGenerating) {
       return;
     }
+    const previousDraft = appendToDraft ? voiceDraftRef.current : null;
+    const previousDurationMs = previousDraft ? resolveVoiceSegmentDuration(previousDraft) : 0;
     setIsVoiceComposerOpen(true);
     setVoiceError(null);
-    setVoiceDraft(null);
     setVoiceCountdownMs(0);
-    setVoiceTranscript(clearVoiceTranscript());
     setVoiceAudioLevel(0);
-    setVoiceDurationMs(0);
     setIsVoiceAutoSendActive(false);
+    voiceAppendBaseRef.current = previousDraft;
+    voiceAppendBaseDurationRef.current = previousDurationMs;
+    if (!previousDraft) {
+      setVoiceDraft(null);
+      voiceDraftRef.current = null;
+      setVoiceTranscript(clearVoiceTranscript());
+      setVoiceDurationMs(0);
+    } else {
+      setVoiceTranscript(previousDraft.transcript ?? clearVoiceTranscript());
+      setVoiceDurationMs(previousDurationMs);
+    }
     try {
       const provider = await ensureVoiceProvider();
       await provider.start();
     } catch (error) {
-      setVoiceError(resolveVoiceErrorMessage(error, config));
+      const resolvedError = resolveVoiceErrorMessage(error, config);
+      voiceAppendBaseRef.current = null;
+      voiceAppendBaseDurationRef.current = 0;
+      setVoiceAudioLevel(0);
+      setVoiceCountdownMs(0);
+      setIsVoiceAutoSendActive(false);
+      if (previousDraft) {
+        voiceDraftRef.current = previousDraft;
+        setVoiceDraft(previousDraft);
+        setVoiceTranscript(previousDraft.transcript ?? clearVoiceTranscript());
+        setVoiceDurationMs(previousDurationMs);
+        setVoiceError(resolvedError);
+        setVoiceState("review");
+        return;
+      }
+      voiceDraftRef.current = null;
+      setVoiceDraft(null);
+      setVoiceTranscript(clearVoiceTranscript());
+      setVoiceDurationMs(0);
+      setVoiceError(resolvedError);
       setVoiceState("error");
     }
   }, [disabled, isGenerating, ensureVoiceProvider, config]);
@@ -3825,6 +4035,8 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
     }
   }, [config]);
   const cancelVoiceCapture = (0, import_react5.useCallback)(async () => {
+    voiceAppendBaseRef.current = null;
+    voiceAppendBaseDurationRef.current = 0;
     if (voiceProviderRef.current) {
       await voiceProviderRef.current.cancel();
     }
@@ -3949,7 +4161,7 @@ var ChatInput = (0, import_react5.memo)(function ChatInput2({
           void cancelVoiceCapture();
         },
         onRecordAgain: () => {
-          void startVoiceCapture();
+          void startVoiceCapture(true);
         },
         onSendNow: sendVoiceDraft,
         onExit: () => {