dv-pipecat-ai 0.0.85.dev821__py3-none-any.whl → 0.0.85.dev822__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of dv-pipecat-ai has been flagged as possibly problematic.
- {dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/METADATA +1 -1
- {dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/RECORD +8 -8
- pipecat/frames/frames.py +12 -0
- pipecat/processors/aggregators/llm_response.py +17 -3
- pipecat/processors/transcript_processor.py +21 -1
- {dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/WHEEL +0 -0
- {dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/licenses/LICENSE +0 -0
- {dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/top_level.txt +0 -0
{dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/RECORD
RENAMED

@@ -1,4 +1,4 @@
-dv_pipecat_ai-0.0.85.
+dv_pipecat_ai-0.0.85.dev822.dist-info/licenses/LICENSE,sha256=DWY2QGf2eMCFhuu2ChairtT6CB7BEFffNVhXWc4Od08,1301
 pipecat/__init__.py,sha256=j0Xm6adxHhd7D06dIyyPV_GlBYLlBnTAERVvD_jAARQ,861
 pipecat/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/adapters/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -79,7 +79,7 @@ pipecat/extensions/voicemail/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NM
 pipecat/extensions/voicemail/voicemail_detector.py,sha256=JxmU2752iWP_1_GmzZReNESUTFAeyEa4XBPL20_C208,30004
 pipecat/frames/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/frames/frames.proto,sha256=JXZm3VXLR8zMOUcOuhVoe2mhM3MQIQGMJXLopdJO_5Y,839
-pipecat/frames/frames.py,sha256=
+pipecat/frames/frames.py,sha256=CxlrFst5DuD6kDp2CE6kWigVezF94y-Snf6h8w1pwVU,49522
 pipecat/frames/protobufs/frames_pb2.py,sha256=VHgGV_W7qQ4sfQK6RHb5_DggLm3PiSYMr6aBZ8_p1cQ,2590
 pipecat/metrics/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/metrics/metrics.py,sha256=bdZNciEtLTtA-xgoKDz2RJAy6fKrXkTwz3pryVHzc2M,2713
@@ -113,7 +113,7 @@ pipecat/processors/idle_frame_processor.py,sha256=z8AuhGap61lA5K35P6XCaOpn4kkmK_
 pipecat/processors/logger.py,sha256=8xa4KKekXQIETlQR7zoGnwUpLNo8CeDVm7YjyXePN-w,2385
 pipecat/processors/producer_processor.py,sha256=iIIOHZd77APvUGP7JqFbznAHUnCULcq_qYiSEjwXHcc,3265
 pipecat/processors/text_transformer.py,sha256=LnfWJYzntJhZhrQ1lgSSY4D4VbHtrQJgrC227M69ZYU,1718
-pipecat/processors/transcript_processor.py,sha256=
+pipecat/processors/transcript_processor.py,sha256=fr5JtlTOfmKnfmYG8ZwRj4DpZWP-uuGi6aNNKtlLxRg,12491
 pipecat/processors/two_stage_user_idle_processor.py,sha256=uf2aZh_lfW-eMxmFogP3R4taAJ1yXOSqjKsR7oXtD0Y,2938
 pipecat/processors/user_idle_processor.py,sha256=Dl-Kcg0B4JZqWXXiyGuvYszGimbu2oKOyOJC92R9_hE,9140
 pipecat/processors/aggregators/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -122,7 +122,7 @@ pipecat/processors/aggregators/gated.py,sha256=tii0sRrBkRW6y9Xq5iTWPnqlOEejU4VqP
 pipecat/processors/aggregators/gated_llm_context.py,sha256=CPv6sMA8irD1zZ3fU1gSv6D7qcPvCA0MdpFhBtJ_ekI,3007
 pipecat/processors/aggregators/gated_open_ai_llm_context.py,sha256=DgqmdPj1u3fP_SVmxtfP7NjHqnyhN_RVVTDfmjbkxAs,361
 pipecat/processors/aggregators/llm_context.py,sha256=wNbZA0Vt0FzNc5cu06xiv1z7DIClIlfqR1ZD8EusbVw,11085
-pipecat/processors/aggregators/llm_response.py,sha256=
+pipecat/processors/aggregators/llm_response.py,sha256=cBNGU8Ld4zT36-QsE1EJemrNA12q7lc9i-vLM9qmLcQ,48075
 pipecat/processors/aggregators/llm_response_universal.py,sha256=5PqmpATpekD8BVWyBExZgatKHsNbZem8M-A7_VwTbiQ,34334
 pipecat/processors/aggregators/openai_llm_context.py,sha256=cC8DXdVPERRN04i0i-1Ys6kusvnbMALeH-Z8Pu5K684,12999
 pipecat/processors/aggregators/sentence.py,sha256=E7e3knfQl6HEGpYMKPklF1aO_gOn-rr7SnynErwfkQk,2235
@@ -415,7 +415,7 @@ pipecat/utils/tracing/service_decorators.py,sha256=fwzxFpi8DJl6BJbK74G0UEB4ccMJg
 pipecat/utils/tracing/setup.py,sha256=7TEgPNpq6M8lww8OQvf0P9FzYc5A30xICGklVA-fua0,2892
 pipecat/utils/tracing/turn_context_provider.py,sha256=ikon3plFOx0XbMrH6DdeHttNpb-U0gzMZIm3bWLc9eI,2485
 pipecat/utils/tracing/turn_trace_observer.py,sha256=dma16SBJpYSOE58YDWy89QzHyQFc_9gQZszKeWixuwc,9725
-dv_pipecat_ai-0.0.85.
-dv_pipecat_ai-0.0.85.
-dv_pipecat_ai-0.0.85.
-dv_pipecat_ai-0.0.85.
+dv_pipecat_ai-0.0.85.dev822.dist-info/METADATA,sha256=32ww2Lem8OVrVN8fSto1BPjfW5dXjPi4fS9Me8Zz-YE,32924
+dv_pipecat_ai-0.0.85.dev822.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+dv_pipecat_ai-0.0.85.dev822.dist-info/top_level.txt,sha256=kQzG20CxGf-nSsHmtXHx3hY2-8zHA3jYg8jk0TajqXc,8
+dv_pipecat_ai-0.0.85.dev822.dist-info/RECORD,,
pipecat/frames/frames.py
CHANGED
@@ -457,6 +457,7 @@ class TranscriptionMessage:
     content: str
     user_id: Optional[str] = None
     timestamp: Optional[str] = None
+    message_id: Optional[int] = None


 @dataclass
@@ -510,6 +511,17 @@ class TranscriptionUpdateFrame(DataFrame):
         return f"{self.name}(pts: {pts}, messages: {len(self.messages)})"


+@dataclass
+class TranscriptDropFrame(DataFrame):
+    """Frame indicating previously emitted transcript chunks should be discarded.
+
+    Parameters:
+        transcript_ids: List of frame/message identifiers to drop.
+    """
+
+    transcript_ids: List[int]
+
+
 @dataclass
 class LLMContextFrame(Frame):
     """Frame containing a universal LLM context.
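Taken together, these two hunks give each user transcript message a stable identifier and add a frame for retracting previously emitted chunks. A minimal sketch of how the pieces relate, assuming the dev822 build; the concrete values below are illustrative only:

from pipecat.frames.frames import TranscriptDropFrame, TranscriptionMessage

# A transcript message can now carry the id of the TranscriptionFrame it was
# built from, so later frames can refer back to it.
message = TranscriptionMessage(
    role="user",
    content="cancel my order",          # illustrative text
    user_id="caller-1",                 # illustrative id
    timestamp="2025-01-01T00:00:00Z",   # illustrative timestamp
    message_id=1234,                    # normally the originating frame's id
)

# A drop frame simply lists the identifiers whose transcript chunks should be
# discarded by whoever stored them.
drop = TranscriptDropFrame(transcript_ids=[1234])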
pipecat/processors/aggregators/llm_response.py
CHANGED

@@ -48,9 +48,10 @@ from pipecat.frames.frames import (
     LLMTextFrame,
     OpenAILLMContextAssistantTimestampFrame,
     SpeechControlParamsFrame,
-    StartInterruptionFrame,
     StartFrame,
+    StartInterruptionFrame,
     TextFrame,
+    TranscriptDropFrame,
     TranscriptionFrame,
     UserImageRawFrame,
     UserStartedSpeakingFrame,
@@ -446,6 +447,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
         self._latest_final_transcript = ""
         self._last_user_speaking_time = 0
         self._last_aggregation_push_time = 0
+        self._pending_transcription_ids: List[int] = []

     async def reset(self):
         """Reset the aggregation state and interruption strategies."""
@@ -453,6 +455,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
         self._was_bot_speaking = False
         self._seen_interim_results = False
         self._waiting_for_aggregation = False
+        self._pending_transcription_ids.clear()
         [await s.reset() for s in self._interruption_strategies]

     async def handle_aggregation(self, aggregation: str):
@@ -588,6 +591,17 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):

         return any([await should_interrupt(s) for s in self._interruption_strategies])

+    async def _discard_pending_transcriptions(self, reason: str):
+        """Notify upstream processors that pending transcripts should be dropped."""
+        if self._pending_transcription_ids:
+            drop_frame = TranscriptDropFrame(transcript_ids=list(self._pending_transcription_ids))
+            self.logger.debug(
+                f"Dropping {len(self._pending_transcription_ids)} transcript chunk(s) due to {reason}"
+            )
+            await self.push_frame(drop_frame, FrameDirection.UPSTREAM)
+            self._pending_transcription_ids.clear()
+        self._aggregation = ""
+
     async def _start(self, frame: StartFrame):
         self._create_aggregation_task()

@@ -616,8 +630,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):

     async def _handle_user_started_speaking(self, frame: UserStartedSpeakingFrame):
         if len(self._aggregation) > 0:
-            self.
-            self._aggregation = ""
+            await self._discard_pending_transcriptions("user_started_speaking")
         self._latest_final_transcript = ""
         self._last_user_speaking_time = time.time()
         self._user_speaking = True
@@ -662,6 +675,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
             return

         self._aggregation += f" {text}" if self._aggregation else text
+        self._pending_transcription_ids.append(frame.id)
         # We just got a final result, so let's reset interim results.
         self._seen_interim_results = False
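In short, the user aggregator now remembers the frame ids of the transcriptions it has aggregated and, instead of silently clearing the aggregation when the user starts speaking again, pushes a TranscriptDropFrame upstream so earlier processors can retract those chunks. As a hedged illustration only (not part of this release), an upstream processor could watch for the frame roughly like this; the class name is hypothetical:

from pipecat.frames.frames import Frame, TranscriptDropFrame
from pipecat.processors.frame_processor import FrameDirection, FrameProcessor


class DroppedTranscriptLogger(FrameProcessor):
    """Hypothetical processor that logs which transcript chunks were retracted."""

    async def process_frame(self, frame: Frame, direction: FrameDirection):
        await super().process_frame(frame, direction)

        if isinstance(frame, TranscriptDropFrame):
            # Emitted upstream by LLMUserContextAggregator when it discards a
            # pending aggregation (e.g. the user started speaking again).
            print(f"Discarded transcript ids: {frame.transcript_ids}")

        await self.push_frame(frame, direction)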
pipecat/processors/transcript_processor.py
CHANGED

@@ -20,6 +20,7 @@ from pipecat.frames.frames import (
     EndFrame,
     Frame,
     InterruptionFrame,
+    TranscriptDropFrame,
     TranscriptionFrame,
     TranscriptionMessage,
     TranscriptionUpdateFrame,
@@ -44,6 +45,7 @@ class BaseTranscriptProcessor(FrameProcessor):
         super().__init__(**kwargs)
         self._processed_messages: List[TranscriptionMessage] = []
         self._register_event_handler("on_transcript_update")
+        self._register_event_handler("on_transcript_drop")

     async def _emit_update(self, messages: List[TranscriptionMessage]):
         """Emit transcript updates for new messages.
@@ -57,6 +59,18 @@ class BaseTranscriptProcessor(FrameProcessor):
         await self._call_event_handler("on_transcript_update", update_frame)
         await self.push_frame(update_frame)

+    async def _handle_transcript_drop(self, frame: TranscriptDropFrame):
+        """Handle transcript drop notifications by removing stored messages."""
+        if not frame.transcript_ids:
+            return
+
+        drop_ids = set(frame.transcript_ids)
+        if drop_ids:
+            self._processed_messages = [
+                msg for msg in self._processed_messages if msg.message_id not in drop_ids
+            ]
+        await self._call_event_handler("on_transcript_drop", frame)
+

 class UserTranscriptProcessor(BaseTranscriptProcessor):
     """Processes user transcription frames into timestamped conversation messages."""
@@ -72,9 +86,15 @@ class UserTranscriptProcessor(BaseTranscriptProcessor):

         if isinstance(frame, TranscriptionFrame):
             message = TranscriptionMessage(
-                role="user",
+                role="user",
+                user_id=frame.user_id,
+                content=frame.text,
+                timestamp=frame.timestamp,
+                message_id=frame.id,
             )
             await self._emit_update([message])
+        elif isinstance(frame, TranscriptDropFrame):
+            await self._handle_transcript_drop(frame)

         await self.push_frame(frame, direction)
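Because BaseTranscriptProcessor now registers an on_transcript_drop event next to on_transcript_update, application code can be notified when stored messages are retracted. A minimal sketch, assuming the existing TranscriptProcessor factory and its event_handler decorator behave as in earlier pipecat releases:

from pipecat.processors.transcript_processor import TranscriptProcessor

transcript = TranscriptProcessor()


@transcript.event_handler("on_transcript_update")
async def handle_update(processor, frame):
    # frame is a TranscriptionUpdateFrame; each message now exposes message_id.
    for message in frame.messages:
        print(f"{message.role}: {message.content} (id={message.message_id})")


@transcript.event_handler("on_transcript_drop")
async def handle_drop(processor, frame):
    # frame is the TranscriptDropFrame; the listed ids have already been
    # removed from the processor's stored messages when this handler fires.
    print(f"Dropped transcript ids: {frame.transcript_ids}")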
{dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/WHEEL
RENAMED
File without changes
{dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/licenses/LICENSE
RENAMED
File without changes
{dv_pipecat_ai-0.0.85.dev821.dist-info → dv_pipecat_ai-0.0.85.dev822.dist-info}/top_level.txt
RENAMED
File without changes