dv-pipecat-ai 0.0.85.dev821__py3-none-any.whl → 0.0.85.dev823__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This release has been flagged as potentially problematic.

dv_pipecat_ai-0.0.85.dev823.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: dv-pipecat-ai
-Version: 0.0.85.dev821
+Version: 0.0.85.dev823
 Summary: An open source framework for voice (and multimodal) assistants
 License-Expression: BSD-2-Clause
 Project-URL: Source, https://github.com/pipecat-ai/pipecat
dv_pipecat_ai-0.0.85.dev823.dist-info/RECORD CHANGED
@@ -1,4 +1,4 @@
-dv_pipecat_ai-0.0.85.dev821.dist-info/licenses/LICENSE,sha256=DWY2QGf2eMCFhuu2ChairtT6CB7BEFffNVhXWc4Od08,1301
+dv_pipecat_ai-0.0.85.dev823.dist-info/licenses/LICENSE,sha256=DWY2QGf2eMCFhuu2ChairtT6CB7BEFffNVhXWc4Od08,1301
 pipecat/__init__.py,sha256=j0Xm6adxHhd7D06dIyyPV_GlBYLlBnTAERVvD_jAARQ,861
 pipecat/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/adapters/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -79,7 +79,7 @@ pipecat/extensions/voicemail/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NM
 pipecat/extensions/voicemail/voicemail_detector.py,sha256=JxmU2752iWP_1_GmzZReNESUTFAeyEa4XBPL20_C208,30004
 pipecat/frames/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/frames/frames.proto,sha256=JXZm3VXLR8zMOUcOuhVoe2mhM3MQIQGMJXLopdJO_5Y,839
-pipecat/frames/frames.py,sha256=_GbvjOe1HRDSVCTqF5nvRaA-oCFrtyWfl457Uq0qkGw,49229
+pipecat/frames/frames.py,sha256=CxlrFst5DuD6kDp2CE6kWigVezF94y-Snf6h8w1pwVU,49522
 pipecat/frames/protobufs/frames_pb2.py,sha256=VHgGV_W7qQ4sfQK6RHb5_DggLm3PiSYMr6aBZ8_p1cQ,2590
 pipecat/metrics/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 pipecat/metrics/metrics.py,sha256=bdZNciEtLTtA-xgoKDz2RJAy6fKrXkTwz3pryVHzc2M,2713
@@ -108,12 +108,12 @@ pipecat/processors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuF
 pipecat/processors/async_generator.py,sha256=qPOZxk5eOad_NrF_Z06vWZ6deXIxb9AKZKYO2e5pkJs,2385
 pipecat/processors/consumer_processor.py,sha256=DrWCKnfblknZJ0bLmR_unIeJ1axQw4IPUn2IB3KLGGA,3228
 pipecat/processors/dtmf_aggregator.py,sha256=mo_IXUlsnVl-_Xn8sbTGnRF4Lkts0h6E3uauGbeFyWs,10204
-pipecat/processors/frame_processor.py,sha256=Qf-EJCWlw2itvJTsFykKBfjcsXRQUDgSqJDF8gb60V0,33806
+pipecat/processors/frame_processor.py,sha256=uBu6Waa0_diMXdQXMZ5V5a_KwaaPzcieyuv5gO9u-ME,33841
 pipecat/processors/idle_frame_processor.py,sha256=z8AuhGap61lA5K35P6XCaOpn4kkmK_9NZNppbpQxheU,3124
 pipecat/processors/logger.py,sha256=8xa4KKekXQIETlQR7zoGnwUpLNo8CeDVm7YjyXePN-w,2385
 pipecat/processors/producer_processor.py,sha256=iIIOHZd77APvUGP7JqFbznAHUnCULcq_qYiSEjwXHcc,3265
 pipecat/processors/text_transformer.py,sha256=LnfWJYzntJhZhrQ1lgSSY4D4VbHtrQJgrC227M69ZYU,1718
-pipecat/processors/transcript_processor.py,sha256=9F00tY3cxt63ZhYvFGSSAnuUTt3J16mEOUHMzIMndMY,11720
+pipecat/processors/transcript_processor.py,sha256=fr5JtlTOfmKnfmYG8ZwRj4DpZWP-uuGi6aNNKtlLxRg,12491
 pipecat/processors/two_stage_user_idle_processor.py,sha256=uf2aZh_lfW-eMxmFogP3R4taAJ1yXOSqjKsR7oXtD0Y,2938
 pipecat/processors/user_idle_processor.py,sha256=Dl-Kcg0B4JZqWXXiyGuvYszGimbu2oKOyOJC92R9_hE,9140
 pipecat/processors/aggregators/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -122,7 +122,7 @@ pipecat/processors/aggregators/gated.py,sha256=tii0sRrBkRW6y9Xq5iTWPnqlOEejU4VqP
 pipecat/processors/aggregators/gated_llm_context.py,sha256=CPv6sMA8irD1zZ3fU1gSv6D7qcPvCA0MdpFhBtJ_ekI,3007
 pipecat/processors/aggregators/gated_open_ai_llm_context.py,sha256=DgqmdPj1u3fP_SVmxtfP7NjHqnyhN_RVVTDfmjbkxAs,361
 pipecat/processors/aggregators/llm_context.py,sha256=wNbZA0Vt0FzNc5cu06xiv1z7DIClIlfqR1ZD8EusbVw,11085
-pipecat/processors/aggregators/llm_response.py,sha256=igjIcBwzXzULWQIzM6XxXlXCHbR4Q5tAHP8PBHaPVNQ,47314
+pipecat/processors/aggregators/llm_response.py,sha256=cBNGU8Ld4zT36-QsE1EJemrNA12q7lc9i-vLM9qmLcQ,48075
 pipecat/processors/aggregators/llm_response_universal.py,sha256=5PqmpATpekD8BVWyBExZgatKHsNbZem8M-A7_VwTbiQ,34334
 pipecat/processors/aggregators/openai_llm_context.py,sha256=cC8DXdVPERRN04i0i-1Ys6kusvnbMALeH-Z8Pu5K684,12999
 pipecat/processors/aggregators/sentence.py,sha256=E7e3knfQl6HEGpYMKPklF1aO_gOn-rr7SnynErwfkQk,2235
@@ -415,7 +415,7 @@ pipecat/utils/tracing/service_decorators.py,sha256=fwzxFpi8DJl6BJbK74G0UEB4ccMJg
 pipecat/utils/tracing/setup.py,sha256=7TEgPNpq6M8lww8OQvf0P9FzYc5A30xICGklVA-fua0,2892
 pipecat/utils/tracing/turn_context_provider.py,sha256=ikon3plFOx0XbMrH6DdeHttNpb-U0gzMZIm3bWLc9eI,2485
 pipecat/utils/tracing/turn_trace_observer.py,sha256=dma16SBJpYSOE58YDWy89QzHyQFc_9gQZszKeWixuwc,9725
-dv_pipecat_ai-0.0.85.dev821.dist-info/METADATA,sha256=mkEkQu0dIz-W8gqGGXsrqlfcD_AzqceP8-vCK0UgMfY,32924
-dv_pipecat_ai-0.0.85.dev821.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-dv_pipecat_ai-0.0.85.dev821.dist-info/top_level.txt,sha256=kQzG20CxGf-nSsHmtXHx3hY2-8zHA3jYg8jk0TajqXc,8
-dv_pipecat_ai-0.0.85.dev821.dist-info/RECORD,,
+dv_pipecat_ai-0.0.85.dev823.dist-info/METADATA,sha256=QzFZChlDc4joKwMeDE3JSyM7EQzpJLPuIyfsNhrVgzE,32924
+dv_pipecat_ai-0.0.85.dev823.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+dv_pipecat_ai-0.0.85.dev823.dist-info/top_level.txt,sha256=kQzG20CxGf-nSsHmtXHx3hY2-8zHA3jYg8jk0TajqXc,8
+dv_pipecat_ai-0.0.85.dev823.dist-info/RECORD,,
pipecat/frames/frames.py CHANGED
@@ -457,6 +457,7 @@ class TranscriptionMessage:
     content: str
     user_id: Optional[str] = None
     timestamp: Optional[str] = None
+    message_id: Optional[int] = None


 @dataclass
@@ -510,6 +511,17 @@ class TranscriptionUpdateFrame(DataFrame):
         return f"{self.name}(pts: {pts}, messages: {len(self.messages)})"


+@dataclass
+class TranscriptDropFrame(DataFrame):
+    """Frame indicating previously emitted transcript chunks should be discarded.
+
+    Parameters:
+        transcript_ids: List of frame/message identifiers to drop.
+    """
+
+    transcript_ids: List[int]
+
+
 @dataclass
 class LLMContextFrame(Frame):
     """Frame containing a universal LLM context.
pipecat/processors/aggregators/llm_response.py CHANGED
@@ -48,9 +48,10 @@ from pipecat.frames.frames import (
     LLMTextFrame,
     OpenAILLMContextAssistantTimestampFrame,
     SpeechControlParamsFrame,
-    StartInterruptionFrame,
     StartFrame,
+    StartInterruptionFrame,
     TextFrame,
+    TranscriptDropFrame,
     TranscriptionFrame,
     UserImageRawFrame,
     UserStartedSpeakingFrame,
@@ -446,6 +447,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
         self._latest_final_transcript = ""
         self._last_user_speaking_time = 0
         self._last_aggregation_push_time = 0
+        self._pending_transcription_ids: List[int] = []

     async def reset(self):
         """Reset the aggregation state and interruption strategies."""
@@ -453,6 +455,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
         self._was_bot_speaking = False
         self._seen_interim_results = False
         self._waiting_for_aggregation = False
+        self._pending_transcription_ids.clear()
         [await s.reset() for s in self._interruption_strategies]

     async def handle_aggregation(self, aggregation: str):
@@ -588,6 +591,17 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):

         return any([await should_interrupt(s) for s in self._interruption_strategies])

+    async def _discard_pending_transcriptions(self, reason: str):
+        """Notify upstream processors that pending transcripts should be dropped."""
+        if self._pending_transcription_ids:
+            drop_frame = TranscriptDropFrame(transcript_ids=list(self._pending_transcription_ids))
+            self.logger.debug(
+                f"Dropping {len(self._pending_transcription_ids)} transcript chunk(s) due to {reason}"
+            )
+            await self.push_frame(drop_frame, FrameDirection.UPSTREAM)
+            self._pending_transcription_ids.clear()
+        self._aggregation = ""
+
     async def _start(self, frame: StartFrame):
         self._create_aggregation_task()

@@ -616,8 +630,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):

     async def _handle_user_started_speaking(self, frame: UserStartedSpeakingFrame):
         if len(self._aggregation) > 0:
-            self.logger.debug(f"Dropping {self._aggregation}")
-            self._aggregation = ""
+            await self._discard_pending_transcriptions("user_started_speaking")
         self._latest_final_transcript = ""
         self._last_user_speaking_time = time.time()
         self._user_speaking = True
@@ -662,6 +675,7 @@ class LLMUserContextAggregator(LLMContextResponseAggregator):
             return

         self._aggregation += f" {text}" if self._aggregation else text
+        self._pending_transcription_ids.append(frame.id)
         # We just got a final result, so let's reset interim results.
         self._seen_interim_results = False

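
The aggregator change is easier to follow as a small piece of state: every final transcription appends its frame id to _pending_transcription_ids, and _discard_pending_transcriptions() turns those ids into a single upstream TranscriptDropFrame before clearing the stale aggregation. The standalone sketch below mirrors that bookkeeping outside the pipeline machinery; the class and names are hypothetical and not part of pipecat.

    from dataclasses import dataclass, field
    from typing import Callable, List

    @dataclass
    class PendingTranscriptTracker:
        """Toy model of the id bookkeeping added to LLMUserContextAggregator (illustrative only)."""

        emit_drop: Callable[[List[int]], None]
        aggregation: str = ""
        pending_ids: List[int] = field(default_factory=list)

        def add_final_transcription(self, frame_id: int, text: str) -> None:
            # Mirrors: self._aggregation += text; self._pending_transcription_ids.append(frame.id)
            self.aggregation = f"{self.aggregation} {text}".strip()
            self.pending_ids.append(frame_id)

        def discard_pending(self) -> None:
            # Mirrors _discard_pending_transcriptions(): one notification upstream, then reset.
            if self.pending_ids:
                self.emit_drop(list(self.pending_ids))
                self.pending_ids.clear()
            self.aggregation = ""

    tracker = PendingTranscriptTracker(emit_drop=lambda ids: print(f"drop {ids}"))
    tracker.add_final_transcription(101, "turn the lights")
    tracker.add_final_transcription(102, "off please")
    tracker.discard_pending()  # prints: drop [101, 102]
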
pipecat/processors/frame_processor.py CHANGED
@@ -591,7 +591,7 @@ class FrameProcessor(BaseObject):

     async def pause_processing_system_frames(self):
         """Pause processing of queued system frames."""
-        logger.trace(f"{self}: pausing system frame processing")
+        self.logger.trace(f"{self}: pausing system frame processing")
         self.__should_block_system_frames = True
         if self.__input_event:
             self.__input_event.clear()
@@ -812,7 +812,7 @@ class FrameProcessor(BaseObject):
             True if the processor has been started.
         """
         if not self.__started:
-            logger.error(f"{self} Trying to process {frame} but StartFrame not received yet")
+            self.logger.error(f"{self} Trying to process {frame} but StartFrame not received yet")
         return self.__started

     def __create_input_task(self):
@@ -876,7 +876,7 @@ class FrameProcessor(BaseObject):

             await self._call_event_handler("on_after_process_frame", frame)
         except Exception as e:
-            logger.exception(f"{self}: error processing frame: {e}")
+            self.logger.exception(f"{self}: error processing frame: {e}")
             await self.push_error(ErrorFrame(str(e)))

     async def __input_frame_task_handler(self):
@@ -890,11 +890,11 @@ class FrameProcessor(BaseObject):
             (frame, direction, callback) = await self.__input_queue.get()

             if self.__should_block_system_frames and self.__input_event:
-                logger.trace(f"{self}: system frame processing paused")
+                self.logger.trace(f"{self}: system frame processing paused")
                 await self.__input_event.wait()
                 self.__input_event.clear()
                 self.__should_block_system_frames = False
-                logger.trace(f"{self}: system frame processing resumed")
+                self.logger.trace(f"{self}: system frame processing resumed")

             if isinstance(frame, SystemFrame):
                 await self.__process_frame(frame, direction, callback)
@@ -913,11 +913,11 @@ class FrameProcessor(BaseObject):
             (frame, direction, callback) = await self.__process_queue.get()

             if self.__should_block_frames and self.__process_event:
-                logger.trace(f"{self}: frame processing paused")
+                self.logger.trace(f"{self}: frame processing paused")
                 await self.__process_event.wait()
                 self.__process_event.clear()
                 self.__should_block_frames = False
-                logger.trace(f"{self}: frame processing resumed")
+                self.logger.trace(f"{self}: frame processing resumed")

             await self.__process_frame(frame, direction, callback)

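
The frame_processor.py hunks only swap the module-level loguru logger for a per-instance self.logger; how that attribute is created is not shown in this diff. The sketch below illustrates the usual loguru pattern for binding per-instance context, purely as an assumed example of why an instance-scoped logger is useful (MyProcessor and the processor context key are hypothetical, not pipecat's actual wiring).

    from loguru import logger

    class MyProcessor:
        """Hypothetical processor with a per-instance bound logger."""

        def __init__(self, name: str):
            self.name = name
            # bind() returns a logger that attaches this context to every record it emits.
            self.logger = logger.bind(processor=name)

        def pause(self):
            # Instance-scoped logging keeps messages attributable to a specific processor.
            self.logger.trace(f"{self}: pausing system frame processing")

        def __str__(self):
            return self.name
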
pipecat/processors/transcript_processor.py CHANGED
@@ -20,6 +20,7 @@ from pipecat.frames.frames import (
     EndFrame,
     Frame,
     InterruptionFrame,
+    TranscriptDropFrame,
     TranscriptionFrame,
     TranscriptionMessage,
     TranscriptionUpdateFrame,
@@ -44,6 +45,7 @@ class BaseTranscriptProcessor(FrameProcessor):
         super().__init__(**kwargs)
         self._processed_messages: List[TranscriptionMessage] = []
         self._register_event_handler("on_transcript_update")
+        self._register_event_handler("on_transcript_drop")

     async def _emit_update(self, messages: List[TranscriptionMessage]):
         """Emit transcript updates for new messages.
@@ -57,6 +59,18 @@ class BaseTranscriptProcessor(FrameProcessor):
         await self._call_event_handler("on_transcript_update", update_frame)
         await self.push_frame(update_frame)

+    async def _handle_transcript_drop(self, frame: TranscriptDropFrame):
+        """Handle transcript drop notifications by removing stored messages."""
+        if not frame.transcript_ids:
+            return
+
+        drop_ids = set(frame.transcript_ids)
+        if drop_ids:
+            self._processed_messages = [
+                msg for msg in self._processed_messages if msg.message_id not in drop_ids
+            ]
+        await self._call_event_handler("on_transcript_drop", frame)
+

 class UserTranscriptProcessor(BaseTranscriptProcessor):
     """Processes user transcription frames into timestamped conversation messages."""
@@ -72,9 +86,15 @@ class UserTranscriptProcessor(BaseTranscriptProcessor):

         if isinstance(frame, TranscriptionFrame):
             message = TranscriptionMessage(
-                role="user", user_id=frame.user_id, content=frame.text, timestamp=frame.timestamp
+                role="user",
+                user_id=frame.user_id,
+                content=frame.text,
+                timestamp=frame.timestamp,
+                message_id=frame.id,
             )
             await self._emit_update([message])
+        elif isinstance(frame, TranscriptDropFrame):
+            await self._handle_transcript_drop(frame)

         await self.push_frame(frame, direction)
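
On the consuming side, the processor now exposes an on_transcript_drop event next to the existing on_transcript_update, so applications that keep their own copy of the conversation can prune retracted chunks. A hedged usage sketch follows; it assumes pipecat's usual event_handler registration pattern, and the history store is a hypothetical application-side detail rather than anything in this diff.

    from pipecat.processors.transcript_processor import UserTranscriptProcessor

    user_transcripts = UserTranscriptProcessor()
    history = {}  # message_id -> text; a hypothetical application-side transcript store

    @user_transcripts.event_handler("on_transcript_update")
    async def on_update(processor, frame):
        for msg in frame.messages:
            history[msg.message_id] = msg.content

    @user_transcripts.event_handler("on_transcript_drop")
    async def on_drop(processor, frame):
        # Remove chunks the aggregator retracted via TranscriptDropFrame.
        for msg_id in frame.transcript_ids:
            history.pop(msg_id, None)
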