dv-pipecat-ai 0.0.74.dev770__py3-none-any.whl → 0.0.82.dev776__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of dv-pipecat-ai might be problematic.
- {dv_pipecat_ai-0.0.74.dev770.dist-info → dv_pipecat_ai-0.0.82.dev776.dist-info}/METADATA +137 -93
- dv_pipecat_ai-0.0.82.dev776.dist-info/RECORD +340 -0
- pipecat/__init__.py +17 -0
- pipecat/adapters/base_llm_adapter.py +36 -1
- pipecat/adapters/schemas/direct_function.py +296 -0
- pipecat/adapters/schemas/function_schema.py +15 -6
- pipecat/adapters/schemas/tools_schema.py +55 -7
- pipecat/adapters/services/anthropic_adapter.py +22 -3
- pipecat/adapters/services/aws_nova_sonic_adapter.py +23 -3
- pipecat/adapters/services/bedrock_adapter.py +22 -3
- pipecat/adapters/services/gemini_adapter.py +16 -3
- pipecat/adapters/services/open_ai_adapter.py +17 -2
- pipecat/adapters/services/open_ai_realtime_adapter.py +23 -3
- pipecat/audio/filters/base_audio_filter.py +30 -6
- pipecat/audio/filters/koala_filter.py +37 -2
- pipecat/audio/filters/krisp_filter.py +59 -6
- pipecat/audio/filters/noisereduce_filter.py +37 -0
- pipecat/audio/interruptions/base_interruption_strategy.py +25 -5
- pipecat/audio/interruptions/min_words_interruption_strategy.py +21 -4
- pipecat/audio/mixers/base_audio_mixer.py +30 -7
- pipecat/audio/mixers/soundfile_mixer.py +53 -6
- pipecat/audio/resamplers/base_audio_resampler.py +17 -9
- pipecat/audio/resamplers/resampy_resampler.py +26 -1
- pipecat/audio/resamplers/soxr_resampler.py +32 -1
- pipecat/audio/resamplers/soxr_stream_resampler.py +101 -0
- pipecat/audio/utils.py +194 -1
- pipecat/audio/vad/silero.py +60 -3
- pipecat/audio/vad/vad_analyzer.py +114 -30
- pipecat/clocks/base_clock.py +19 -0
- pipecat/clocks/system_clock.py +25 -0
- pipecat/extensions/voicemail/__init__.py +0 -0
- pipecat/extensions/voicemail/voicemail_detector.py +707 -0
- pipecat/frames/frames.py +590 -156
- pipecat/metrics/metrics.py +64 -1
- pipecat/observers/base_observer.py +58 -19
- pipecat/observers/loggers/debug_log_observer.py +56 -64
- pipecat/observers/loggers/llm_log_observer.py +8 -1
- pipecat/observers/loggers/transcription_log_observer.py +19 -7
- pipecat/observers/loggers/user_bot_latency_log_observer.py +32 -5
- pipecat/observers/turn_tracking_observer.py +26 -1
- pipecat/pipeline/base_pipeline.py +5 -7
- pipecat/pipeline/base_task.py +52 -9
- pipecat/pipeline/parallel_pipeline.py +121 -177
- pipecat/pipeline/pipeline.py +129 -20
- pipecat/pipeline/runner.py +50 -1
- pipecat/pipeline/sync_parallel_pipeline.py +132 -32
- pipecat/pipeline/task.py +263 -280
- pipecat/pipeline/task_observer.py +85 -34
- pipecat/pipeline/to_be_updated/merge_pipeline.py +32 -2
- pipecat/processors/aggregators/dtmf_aggregator.py +29 -22
- pipecat/processors/aggregators/gated.py +25 -24
- pipecat/processors/aggregators/gated_openai_llm_context.py +22 -2
- pipecat/processors/aggregators/llm_response.py +398 -89
- pipecat/processors/aggregators/openai_llm_context.py +161 -13
- pipecat/processors/aggregators/sentence.py +25 -14
- pipecat/processors/aggregators/user_response.py +28 -3
- pipecat/processors/aggregators/vision_image_frame.py +24 -14
- pipecat/processors/async_generator.py +28 -0
- pipecat/processors/audio/audio_buffer_processor.py +78 -37
- pipecat/processors/consumer_processor.py +25 -6
- pipecat/processors/filters/frame_filter.py +23 -0
- pipecat/processors/filters/function_filter.py +30 -0
- pipecat/processors/filters/identity_filter.py +17 -2
- pipecat/processors/filters/null_filter.py +24 -1
- pipecat/processors/filters/stt_mute_filter.py +56 -21
- pipecat/processors/filters/wake_check_filter.py +46 -3
- pipecat/processors/filters/wake_notifier_filter.py +21 -3
- pipecat/processors/frame_processor.py +488 -131
- pipecat/processors/frameworks/langchain.py +38 -3
- pipecat/processors/frameworks/rtvi.py +719 -34
- pipecat/processors/gstreamer/pipeline_source.py +41 -0
- pipecat/processors/idle_frame_processor.py +26 -3
- pipecat/processors/logger.py +23 -0
- pipecat/processors/metrics/frame_processor_metrics.py +77 -4
- pipecat/processors/metrics/sentry.py +42 -4
- pipecat/processors/producer_processor.py +34 -14
- pipecat/processors/text_transformer.py +22 -10
- pipecat/processors/transcript_processor.py +48 -29
- pipecat/processors/user_idle_processor.py +31 -21
- pipecat/runner/__init__.py +1 -0
- pipecat/runner/daily.py +132 -0
- pipecat/runner/livekit.py +148 -0
- pipecat/runner/run.py +543 -0
- pipecat/runner/types.py +67 -0
- pipecat/runner/utils.py +515 -0
- pipecat/serializers/base_serializer.py +42 -0
- pipecat/serializers/exotel.py +17 -6
- pipecat/serializers/genesys.py +95 -0
- pipecat/serializers/livekit.py +33 -0
- pipecat/serializers/plivo.py +16 -15
- pipecat/serializers/protobuf.py +37 -1
- pipecat/serializers/telnyx.py +18 -17
- pipecat/serializers/twilio.py +32 -16
- pipecat/services/ai_service.py +5 -3
- pipecat/services/anthropic/llm.py +113 -43
- pipecat/services/assemblyai/models.py +63 -5
- pipecat/services/assemblyai/stt.py +64 -11
- pipecat/services/asyncai/__init__.py +0 -0
- pipecat/services/asyncai/tts.py +501 -0
- pipecat/services/aws/llm.py +185 -111
- pipecat/services/aws/stt.py +217 -23
- pipecat/services/aws/tts.py +118 -52
- pipecat/services/aws/utils.py +101 -5
- pipecat/services/aws_nova_sonic/aws.py +82 -64
- pipecat/services/aws_nova_sonic/context.py +15 -6
- pipecat/services/azure/common.py +10 -2
- pipecat/services/azure/image.py +32 -0
- pipecat/services/azure/llm.py +9 -7
- pipecat/services/azure/stt.py +65 -2
- pipecat/services/azure/tts.py +154 -23
- pipecat/services/cartesia/stt.py +125 -8
- pipecat/services/cartesia/tts.py +102 -38
- pipecat/services/cerebras/llm.py +15 -23
- pipecat/services/deepgram/stt.py +19 -11
- pipecat/services/deepgram/tts.py +36 -0
- pipecat/services/deepseek/llm.py +14 -23
- pipecat/services/elevenlabs/tts.py +330 -64
- pipecat/services/fal/image.py +43 -0
- pipecat/services/fal/stt.py +48 -10
- pipecat/services/fireworks/llm.py +14 -21
- pipecat/services/fish/tts.py +109 -9
- pipecat/services/gemini_multimodal_live/__init__.py +1 -0
- pipecat/services/gemini_multimodal_live/events.py +83 -2
- pipecat/services/gemini_multimodal_live/file_api.py +189 -0
- pipecat/services/gemini_multimodal_live/gemini.py +218 -21
- pipecat/services/gladia/config.py +17 -10
- pipecat/services/gladia/stt.py +82 -36
- pipecat/services/google/frames.py +40 -0
- pipecat/services/google/google.py +2 -0
- pipecat/services/google/image.py +39 -2
- pipecat/services/google/llm.py +176 -58
- pipecat/services/google/llm_openai.py +26 -4
- pipecat/services/google/llm_vertex.py +37 -15
- pipecat/services/google/rtvi.py +41 -0
- pipecat/services/google/stt.py +65 -17
- pipecat/services/google/test-google-chirp.py +45 -0
- pipecat/services/google/tts.py +390 -19
- pipecat/services/grok/llm.py +8 -6
- pipecat/services/groq/llm.py +8 -6
- pipecat/services/groq/stt.py +13 -9
- pipecat/services/groq/tts.py +40 -0
- pipecat/services/hamsa/__init__.py +9 -0
- pipecat/services/hamsa/stt.py +241 -0
- pipecat/services/heygen/__init__.py +5 -0
- pipecat/services/heygen/api.py +281 -0
- pipecat/services/heygen/client.py +620 -0
- pipecat/services/heygen/video.py +338 -0
- pipecat/services/image_service.py +5 -3
- pipecat/services/inworld/__init__.py +1 -0
- pipecat/services/inworld/tts.py +592 -0
- pipecat/services/llm_service.py +127 -45
- pipecat/services/lmnt/tts.py +80 -7
- pipecat/services/mcp_service.py +85 -44
- pipecat/services/mem0/memory.py +42 -13
- pipecat/services/minimax/tts.py +74 -15
- pipecat/services/mistral/__init__.py +0 -0
- pipecat/services/mistral/llm.py +185 -0
- pipecat/services/moondream/vision.py +55 -10
- pipecat/services/neuphonic/tts.py +275 -48
- pipecat/services/nim/llm.py +8 -6
- pipecat/services/ollama/llm.py +27 -7
- pipecat/services/openai/base_llm.py +54 -16
- pipecat/services/openai/image.py +30 -0
- pipecat/services/openai/llm.py +7 -5
- pipecat/services/openai/stt.py +13 -9
- pipecat/services/openai/tts.py +42 -10
- pipecat/services/openai_realtime_beta/azure.py +11 -9
- pipecat/services/openai_realtime_beta/context.py +7 -5
- pipecat/services/openai_realtime_beta/events.py +10 -7
- pipecat/services/openai_realtime_beta/openai.py +37 -18
- pipecat/services/openpipe/llm.py +30 -24
- pipecat/services/openrouter/llm.py +9 -7
- pipecat/services/perplexity/llm.py +15 -19
- pipecat/services/piper/tts.py +26 -12
- pipecat/services/playht/tts.py +227 -65
- pipecat/services/qwen/llm.py +8 -6
- pipecat/services/rime/tts.py +128 -17
- pipecat/services/riva/stt.py +160 -22
- pipecat/services/riva/tts.py +67 -2
- pipecat/services/sambanova/llm.py +19 -17
- pipecat/services/sambanova/stt.py +14 -8
- pipecat/services/sarvam/tts.py +60 -13
- pipecat/services/simli/video.py +82 -21
- pipecat/services/soniox/__init__.py +0 -0
- pipecat/services/soniox/stt.py +398 -0
- pipecat/services/speechmatics/stt.py +29 -17
- pipecat/services/stt_service.py +47 -11
- pipecat/services/tavus/video.py +94 -25
- pipecat/services/together/llm.py +8 -6
- pipecat/services/tts_service.py +77 -53
- pipecat/services/ultravox/stt.py +46 -43
- pipecat/services/vision_service.py +5 -3
- pipecat/services/websocket_service.py +12 -11
- pipecat/services/whisper/base_stt.py +58 -12
- pipecat/services/whisper/stt.py +69 -58
- pipecat/services/xtts/tts.py +59 -2
- pipecat/sync/base_notifier.py +19 -0
- pipecat/sync/event_notifier.py +24 -0
- pipecat/tests/utils.py +73 -5
- pipecat/transcriptions/language.py +24 -0
- pipecat/transports/base_input.py +112 -8
- pipecat/transports/base_output.py +235 -13
- pipecat/transports/base_transport.py +119 -0
- pipecat/transports/local/audio.py +76 -0
- pipecat/transports/local/tk.py +84 -0
- pipecat/transports/network/fastapi_websocket.py +174 -15
- pipecat/transports/network/small_webrtc.py +383 -39
- pipecat/transports/network/webrtc_connection.py +214 -8
- pipecat/transports/network/websocket_client.py +171 -1
- pipecat/transports/network/websocket_server.py +147 -9
- pipecat/transports/services/daily.py +792 -70
- pipecat/transports/services/helpers/daily_rest.py +122 -129
- pipecat/transports/services/livekit.py +339 -4
- pipecat/transports/services/tavus.py +273 -38
- pipecat/utils/asyncio/task_manager.py +92 -186
- pipecat/utils/base_object.py +83 -1
- pipecat/utils/network.py +2 -0
- pipecat/utils/string.py +114 -58
- pipecat/utils/text/base_text_aggregator.py +44 -13
- pipecat/utils/text/base_text_filter.py +46 -0
- pipecat/utils/text/markdown_text_filter.py +70 -14
- pipecat/utils/text/pattern_pair_aggregator.py +18 -14
- pipecat/utils/text/simple_text_aggregator.py +43 -2
- pipecat/utils/text/skip_tags_aggregator.py +21 -13
- pipecat/utils/time.py +36 -0
- pipecat/utils/tracing/class_decorators.py +32 -7
- pipecat/utils/tracing/conversation_context_provider.py +12 -2
- pipecat/utils/tracing/service_attributes.py +80 -64
- pipecat/utils/tracing/service_decorators.py +48 -21
- pipecat/utils/tracing/setup.py +13 -7
- pipecat/utils/tracing/turn_context_provider.py +12 -2
- pipecat/utils/tracing/turn_trace_observer.py +27 -0
- pipecat/utils/utils.py +14 -14
- dv_pipecat_ai-0.0.74.dev770.dist-info/RECORD +0 -319
- pipecat/examples/daily_runner.py +0 -64
- pipecat/examples/run.py +0 -265
- pipecat/utils/asyncio/watchdog_async_iterator.py +0 -72
- pipecat/utils/asyncio/watchdog_event.py +0 -42
- pipecat/utils/asyncio/watchdog_priority_queue.py +0 -48
- pipecat/utils/asyncio/watchdog_queue.py +0 -48
- {dv_pipecat_ai-0.0.74.dev770.dist-info → dv_pipecat_ai-0.0.82.dev776.dist-info}/WHEEL +0 -0
- {dv_pipecat_ai-0.0.74.dev770.dist-info → dv_pipecat_ai-0.0.82.dev776.dist-info}/licenses/LICENSE +0 -0
- {dv_pipecat_ai-0.0.74.dev770.dist-info → dv_pipecat_ai-0.0.82.dev776.dist-info}/top_level.txt +0 -0
- /pipecat/{examples → extensions}/__init__.py +0 -0
pipecat/processors/aggregators/openai_llm_context.py

```diff
@@ -4,6 +4,12 @@
 # SPDX-License-Identifier: BSD 2-Clause License
 #
 
+"""OpenAI LLM context management for Pipecat.
+
+This module provides classes for managing OpenAI-specific conversation contexts,
+including message handling, tool management, and image/audio processing capabilities.
+"""
+
 import base64
 import copy
 import io
```
```diff
@@ -29,7 +35,21 @@ from pipecat.processors.frame_processor import FrameDirection, FrameProcessor
 
 
 class CustomEncoder(json.JSONEncoder):
+    """Custom JSON encoder for handling special data types in logging.
+
+    Provides specialized encoding for io.BytesIO objects to display
+    readable representations in log output instead of raw binary data.
+    """
+
     def default(self, obj):
+        """Encode special objects for JSON serialization.
+
+        Args:
+            obj: The object to encode.
+
+        Returns:
+            Encoded representation of the object.
+        """
         if isinstance(obj, io.BytesIO):
             # Convert the first 8 bytes to an ASCII hex string
             return f"{obj.getbuffer()[0:8].hex()}..."
```
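This encoder is wired into `get_messages_json()` further down via `json.dumps(..., cls=CustomEncoder)`. As a quick illustration of the pattern (a standalone sketch, not pipecat code), a `json.JSONEncoder` subclass gets a chance to handle any object the default encoder cannot serialize:

```python
import io
import json


class BytesIOEncoder(json.JSONEncoder):
    """Hypothetical stand-in for pipecat's CustomEncoder: summarize BytesIO buffers."""

    def default(self, obj):
        if isinstance(obj, io.BytesIO):
            # Show only the first 8 bytes as hex instead of dumping raw binary.
            return f"{obj.getbuffer()[0:8].hex()}..."
        # Fall back to the base class, which raises TypeError for unknown types.
        return super().default(obj)


payload = {"role": "user", "audio": io.BytesIO(b"RIFF....WAVEfmt ")}
print(json.dumps(payload, cls=BytesIOEncoder, indent=2))
# -> {"role": "user", "audio": "524946462e2e2e2e..."}
```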
```diff
@@ -37,63 +57,140 @@ class CustomEncoder(json.JSONEncoder):
 
 
 class OpenAILLMContext:
+    """Manages conversation context for OpenAI LLM interactions.
+
+    Handles message history, tool definitions, tool choices, and multimedia content
+    for OpenAI API conversations. Provides methods for message manipulation,
+    content formatting, and integration with various LLM adapters.
+    """
+
     def __init__(
         self,
         messages: Optional[List[ChatCompletionMessageParam]] = None,
         tools: List[ChatCompletionToolParam] | NotGiven | ToolsSchema = NOT_GIVEN,
         tool_choice: ChatCompletionToolChoiceOptionParam | NotGiven = NOT_GIVEN,
     ):
+        """Initialize the OpenAI LLM context.
+
+        Args:
+            messages: Initial list of conversation messages.
+            tools: Available tools for the LLM to use.
+            tool_choice: Tool selection strategy for the LLM.
+        """
         self._messages: List[ChatCompletionMessageParam] = messages if messages else []
         self._tool_choice: ChatCompletionToolChoiceOptionParam | NotGiven = tool_choice
         self._tools: List[ChatCompletionToolParam] | NotGiven | ToolsSchema = tools
         self._llm_adapter: Optional[BaseLLMAdapter] = None
 
     def get_llm_adapter(self) -> Optional[BaseLLMAdapter]:
+        """Get the current LLM adapter.
+
+        Returns:
+            The currently set LLM adapter, or None if not set.
+        """
         return self._llm_adapter
 
     def set_llm_adapter(self, llm_adapter: BaseLLMAdapter):
+        """Set the LLM adapter for context processing.
+
+        Args:
+            llm_adapter: The LLM adapter to use for tool conversion.
+        """
         self._llm_adapter = llm_adapter
 
     @staticmethod
    def from_messages(messages: List[dict]) -> "OpenAILLMContext":
+        """Create a context from a list of message dictionaries.
+
+        Args:
+            messages: List of message dictionaries to convert to context.
+
+        Returns:
+            New OpenAILLMContext instance with the provided messages.
+        """
         context = OpenAILLMContext()
 
         for message in messages:
-            if "name" not in message:
-                message["name"] = message["role"]
             context.add_message(message)
         return context
 
     @property
     def messages(self) -> List[ChatCompletionMessageParam]:
+        """Get the current messages list.
+
+        Returns:
+            List of conversation messages.
+        """
         return self._messages
 
     @property
     def tools(self) -> List[ChatCompletionToolParam] | NotGiven | List[Any]:
+        """Get the tools list, converting through adapter if available.
+
+        Returns:
+            Tools list, potentially converted by the LLM adapter.
+        """
         if self._llm_adapter:
             return self._llm_adapter.from_standard_tools(self._tools)
         return self._tools
 
     @property
     def tool_choice(self) -> ChatCompletionToolChoiceOptionParam | NotGiven:
+        """Get the current tool choice setting.
+
+        Returns:
+            The tool choice configuration.
+        """
         return self._tool_choice
 
     def add_message(self, message: ChatCompletionMessageParam):
+        """Add a single message to the context.
+
+        Args:
+            message: The message to add to the conversation history.
+        """
         self._messages.append(message)
 
     def add_messages(self, messages: List[ChatCompletionMessageParam]):
+        """Add multiple messages to the context.
+
+        Args:
+            messages: List of messages to add to the conversation history.
+        """
         self._messages.extend(messages)
 
     def set_messages(self, messages: List[ChatCompletionMessageParam]):
+        """Replace all messages in the context.
+
+        Args:
+            messages: New list of messages to replace the current history.
+        """
         self._messages[:] = messages
 
     def get_messages(self) -> List[ChatCompletionMessageParam]:
+        """Get a copy of the current messages list.
+
+        Returns:
+            List of all messages in the conversation history.
+        """
         return self._messages
 
     def get_messages_json(self) -> str:
+        """Get messages as a formatted JSON string.
+
+        Returns:
+            JSON string representation of all messages with custom encoding.
+        """
         return json.dumps(self._messages, cls=CustomEncoder, ensure_ascii=False, indent=2)
 
     def get_messages_for_logging(self) -> str:
+        """Get sanitized messages suitable for logging.
+
+        Removes or truncates sensitive data like image content for safe logging.
+
+        Returns:
+            JSON string with sanitized message content for logging.
+        """
         msgs = []
         for message in self.messages:
             msg = copy.deepcopy(message)
```
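Taken together, these methods give the context a compact message-management API. A minimal usage sketch (assuming pipecat is installed; this example is illustrative, not taken from the package):

```python
from pipecat.processors.aggregators.openai_llm_context import OpenAILLMContext

# Build a context from plain OpenAI-style message dicts.
context = OpenAILLMContext.from_messages(
    [{"role": "system", "content": "You are a helpful assistant."}]
)

# Append a user turn, then inspect the history as JSON.
context.add_message({"role": "user", "content": "Hello!"})
print(context.get_messages_json())  # serialized with CustomEncoder, indent=2
```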
```diff
@@ -116,17 +213,18 @@
     def from_standard_message(self, message):
         """Convert from OpenAI message format to OpenAI message format (passthrough).
 
-        OpenAI's format allows both simple string content and structured content
-
-
+        OpenAI's format allows both simple string content and structured content::
+
+            Simple: {"role": "user", "content": "Hello"}
+            Structured: {"role": "user", "content": [{"type": "text", "text": "Hello"}]}
 
         Since OpenAI is our standard format, this is a passthrough function.
 
         Args:
-            message
+            message: Message in OpenAI format.
 
         Returns:
-
+            Same message, unchanged.
         """
         return message
 
```
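Because both content shapes are valid, downstream code that needs plain text has to flatten the structured form. A small hypothetical helper (not part of pipecat) illustrating the two shapes named in the docstring:

```python
def content_to_text(message: dict) -> str:
    """Flatten OpenAI-style message content to plain text."""
    content = message.get("content", "")
    if isinstance(content, str):  # simple form
        return content
    # Structured form: a list of typed parts; keep only the text parts.
    return " ".join(part["text"] for part in content if part.get("type") == "text")


assert content_to_text({"role": "user", "content": "Hello"}) == "Hello"
assert content_to_text(
    {"role": "user", "content": [{"type": "text", "text": "Hello"}]}
) == "Hello"
```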
```diff
@@ -138,20 +236,28 @@
         other LLM services that may need to return multiple messages.
 
         Args:
-            obj
-
-            - List content: {"role": "user", "content": [{"type": "text", "text": "Hello"}]}
+            obj: Message in OpenAI format with either simple string content
+                or structured list content.
 
         Returns:
-
-            the content was in simple string or structured list format
+            List containing the original messages, preserving the content format.
         """
         return [obj]
 
     def get_messages_for_initializing_history(self):
+        """Get messages for initializing conversation history.
+
+        Returns:
+            List of messages suitable for history initialization.
+        """
         return self._messages
 
     def get_messages_for_persistent_storage(self):
+        """Get messages formatted for persistent storage.
+
+        Returns:
+            List of messages converted to standard format for storage.
+        """
         messages = []
         for m in self._messages:
             standard_messages = self.to_standard_messages(m)
```
```diff
@@ -159,9 +265,19 @@
         return messages
 
     def set_tool_choice(self, tool_choice: ChatCompletionToolChoiceOptionParam | NotGiven):
+        """Set the tool choice configuration.
+
+        Args:
+            tool_choice: Tool selection strategy for the LLM.
+        """
         self._tool_choice = tool_choice
 
     def set_tools(self, tools: List[ChatCompletionToolParam] | NotGiven | ToolsSchema = NOT_GIVEN):
+        """Set the available tools for the LLM.
+
+        Args:
+            tools: List of tools available to the LLM, or NOT_GIVEN to disable tools.
+        """
         if tools != NOT_GIVEN and isinstance(tools, list) and len(tools) == 0:
             tools = NOT_GIVEN
         self._tools = tools
```
```diff
@@ -169,6 +285,14 @@
     def add_image_frame_message(
         self, *, format: str, size: tuple[int, int], image: bytes, text: str = None
     ):
+        """Add a message containing an image frame.
+
+        Args:
+            format: Image format (e.g., 'RGB', 'RGBA').
+            size: Image dimensions as (width, height) tuple.
+            image: Raw image bytes.
+            text: Optional text to include with the image.
+        """
         buffer = io.BytesIO()
         Image.frombytes(format, size, image).save(buffer, format="JPEG")
         encoded_image = base64.b64encode(buffer.getvalue()).decode("utf-8")
```
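The method body visible above follows a common recipe: wrap the raw pixels with PIL, re-encode to JPEG in memory, and base64 the result for an `image_url` content part. A standalone sketch of the same recipe (requires Pillow; the data-URL shape shown is the standard OpenAI vision format, assumed here rather than taken from this diff):

```python
import base64
import io

from PIL import Image

# A 2x2 RGB image from raw bytes (3 bytes per pixel, all red).
raw = bytes([255, 0, 0] * 4)
buffer = io.BytesIO()
Image.frombytes("RGB", (2, 2), raw).save(buffer, format="JPEG")
encoded = base64.b64encode(buffer.getvalue()).decode("utf-8")

content_part = {
    "type": "image_url",
    "image_url": {"url": f"data:image/jpeg;base64,{encoded}"},
}
```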
```diff
@@ -182,10 +306,30 @@
         self.add_message({"role": "user", "content": content})
 
     def add_audio_frames_message(self, *, audio_frames: list[AudioRawFrame], text: str = None):
+        """Add a message containing audio frames.
+
+        Args:
+            audio_frames: List of audio frame objects to include.
+            text: Optional text to include with the audio.
+
+        Note:
+            This method is currently a placeholder for future implementation.
+        """
         # todo: implement for OpenAI models and others
         pass
 
     def create_wav_header(self, sample_rate, num_channels, bits_per_sample, data_size):
+        """Create a WAV file header for audio data.
+
+        Args:
+            sample_rate: Audio sample rate in Hz.
+            num_channels: Number of audio channels.
+            bits_per_sample: Bits per audio sample.
+            data_size: Size of audio data in bytes.
+
+        Returns:
+            WAV header as a bytearray.
+        """
         # RIFF chunk descriptor
         header = bytearray()
         header.extend(b"RIFF")  # ChunkID
```
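For reference, the canonical 44-byte RIFF/WAVE header such a method produces can be built with `struct` alone. A minimal sketch for PCM audio (standard WAV layout; not pipecat's exact implementation, which continues past the `b"RIFF"` line shown above):

```python
import struct


def wav_header(sample_rate: int, num_channels: int, bits_per_sample: int, data_size: int) -> bytes:
    """Build a canonical 44-byte RIFF/WAVE header for PCM audio."""
    byte_rate = sample_rate * num_channels * bits_per_sample // 8
    block_align = num_channels * bits_per_sample // 8
    return struct.pack(
        "<4sI4s4sIHHIIHH4sI",
        b"RIFF", 36 + data_size, b"WAVE",  # RIFF chunk descriptor
        b"fmt ", 16, 1, num_channels,      # fmt subchunk: size 16, PCM, channels
        sample_rate, byte_rate, block_align, bits_per_sample,
        b"data", data_size,                # data subchunk header
    )


assert len(wav_header(16000, 1, 16, 0)) == 44
```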
```diff
@@ -211,10 +355,14 @@
 
 @dataclass
 class OpenAILLMContextFrame(Frame):
-    """
+    """Frame containing OpenAI-specific LLM context.
+
+    Like an LLMMessagesFrame, but with extra context specific to the OpenAI
     API. The context in this message is also mutable, and will be changed by the
     OpenAIContextAggregator frame processor.
 
+    Parameters:
+        context: The OpenAI LLM context containing messages, tools, and configuration.
     """
 
     context: OpenAILLMContext
```
pipecat/processors/aggregators/sentence.py

```diff
@@ -4,35 +4,46 @@
 # SPDX-License-Identifier: BSD 2-Clause License
 #
 
+"""Text sentence aggregation processor for Pipecat.
+
+This module provides a frame processor that accumulates text frames into
+complete sentences, only outputting when a sentence-ending pattern is detected.
+"""
+
 from pipecat.frames.frames import EndFrame, Frame, InterimTranscriptionFrame, TextFrame
 from pipecat.processors.frame_processor import FrameDirection, FrameProcessor
 from pipecat.utils.string import match_endofsentence
 
 
 class SentenceAggregator(FrameProcessor):
-    """
+    """Aggregates text frames into complete sentences.
+
+    This processor accumulates incoming text frames until a sentence-ending
+    pattern is detected, then outputs the complete sentence as a single frame.
+    Useful for ensuring downstream processors receive coherent, complete sentences
+    rather than fragmented text.
+
+    Frame input/output::
 
-    Frame input/output:
         TextFrame("Hello,") -> None
-        TextFrame(" world.") -> TextFrame("Hello world.")
-
-    Doctest: FIXME to work with asyncio
-    >>> import asyncio
-    >>> async def print_frames(aggregator, frame):
-    ...     async for frame in aggregator.process_frame(frame):
-    ...         print(frame.text)
-
-    >>> aggregator = SentenceAggregator()
-    >>> asyncio.run(print_frames(aggregator, TextFrame("Hello,")))
-    >>> asyncio.run(print_frames(aggregator, TextFrame(" world.")))
-    Hello, world.
+        TextFrame(" world.") -> TextFrame("Hello, world.")
     """
 
     def __init__(self):
+        """Initialize the sentence aggregator.
+
+        Sets up internal state for accumulating text frames into complete sentences.
+        """
         super().__init__()
         self._aggregation = ""
 
     async def process_frame(self, frame: Frame, direction: FrameDirection):
+        """Process incoming frames and aggregate text into complete sentences.
+
+        Args:
+            frame: The incoming frame to process.
+            direction: The direction of frame flow in the pipeline.
+        """
         await super().process_frame(frame, direction)
 
         # We ignore interim description at this point.
```
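Stripped of the frame plumbing, the aggregation logic reduces to buffering text until an end-of-sentence match succeeds. A pipeline-free sketch of that core pattern (the regex is a crude stand-in for pipecat's `match_endofsentence`, which is more robust):

```python
import re


class SentenceBuffer:
    """Accumulate text chunks; emit only when a sentence ending is seen."""

    def __init__(self):
        self._aggregation = ""

    def push(self, text: str) -> str | None:
        self._aggregation += text
        # Crude stand-in for pipecat's match_endofsentence().
        if re.search(r"[.!?]\s*$", self._aggregation):
            sentence, self._aggregation = self._aggregation, ""
            return sentence
        return None


buf = SentenceBuffer()
assert buf.push("Hello,") is None
assert buf.push(" world.") == "Hello, world."
```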
pipecat/processors/aggregators/user_response.py

```diff
@@ -4,15 +4,40 @@
 # SPDX-License-Identifier: BSD 2-Clause License
 #
 
+"""User response aggregation for text frames.
+
+This module provides an aggregator that collects user responses and outputs
+them as TextFrame objects, useful for capturing and processing user input
+in conversational pipelines.
+"""
+
 from pipecat.frames.frames import TextFrame
-from pipecat.processors.aggregators.llm_response import LLMUserResponseAggregator
+from pipecat.processors.aggregators.llm_response import LLMUserContextAggregator
+from pipecat.processors.aggregators.openai_llm_context import OpenAILLMContext
+
 
+class UserResponseAggregator(LLMUserContextAggregator):
+    """Aggregates user responses into TextFrame objects.
+
+    This aggregator extends LLMUserContextAggregator to specifically handle
+    user input by collecting text responses and outputting them as TextFrame
+    objects when the aggregation is complete.
+    """
 
-class UserResponseAggregator(LLMUserResponseAggregator):
     def __init__(self, **kwargs):
-        super().__init__(**kwargs)
+        """Initialize the user response aggregator.
+
+        Args:
+            **kwargs: Additional arguments passed to parent LLMUserContextAggregator.
+        """
+        super().__init__(context=OpenAILLMContext(), **kwargs)
 
     async def push_aggregation(self):
+        """Push the aggregated user response as a TextFrame.
+
+        Creates a TextFrame from the current aggregation if it contains content,
+        resets the aggregation state, and pushes the frame downstream.
+        """
         if len(self._aggregation) > 0:
             frame = TextFrame(self._aggregation.strip())
 
```
pipecat/processors/aggregators/vision_image_frame.py

```diff
@@ -4,33 +4,43 @@
 # SPDX-License-Identifier: BSD 2-Clause License
 #
 
+"""Vision image frame aggregation for Pipecat.
+
+This module provides frame aggregation functionality to combine text and image
+frames into vision frames for multimodal processing.
+"""
+
 from pipecat.frames.frames import Frame, InputImageRawFrame, TextFrame, VisionImageRawFrame
 from pipecat.processors.frame_processor import FrameDirection, FrameProcessor
 
 
 class VisionImageFrameAggregator(FrameProcessor):
-    """
-    InputImageRawFrame. After the InputImageRawFrame arrives it will output a
-    VisionImageRawFrame.
-
-    >>> from pipecat.frames.frames import ImageFrame
-
-    >>> async def print_frames(aggregator, frame):
-    ...     async for frame in aggregator.process_frame(frame):
-    ...         print(frame)
-
-    >>> aggregator = VisionImageFrameAggregator()
-    >>> asyncio.run(print_frames(aggregator, TextFrame("What do you see?")))
-    >>> asyncio.run(print_frames(aggregator, ImageFrame(image=bytes([]), size=(0, 0))))
-    VisionImageFrame, text: What do you see?, image size: 0x0, buffer size: 0 B
+    """Aggregates consecutive text and image frames into vision frames.
 
+    This aggregator waits for a consecutive TextFrame and an InputImageRawFrame.
+    After the InputImageRawFrame arrives it will output a VisionImageRawFrame
+    combining both the text and image data for multimodal processing.
     """
 
     def __init__(self):
+        """Initialize the vision image frame aggregator.
+
+        The aggregator starts with no cached text, waiting for the first
+        TextFrame to arrive before it can create vision frames.
+        """
         super().__init__()
         self._describe_text = None
 
     async def process_frame(self, frame: Frame, direction: FrameDirection):
+        """Process incoming frames and aggregate text with images.
+
+        Caches TextFrames and combines them with subsequent InputImageRawFrames
+        to create VisionImageRawFrames. Other frames are passed through unchanged.
+
+        Args:
+            frame: The incoming frame to process.
+            direction: The direction of frame flow in the pipeline.
+        """
         await super().process_frame(frame, direction)
 
         if isinstance(frame, TextFrame):
```
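The pairing logic amounts to a one-slot cache: remember the most recent text, attach it to the next image. A pipeline-free sketch of that pattern (illustrative classes, not pipecat's):

```python
from dataclasses import dataclass
from typing import Optional


@dataclass
class VisionRequest:
    text: Optional[str]
    image: bytes


class TextImagePairer:
    """One-slot cache: remember the last text, attach it to the next image."""

    def __init__(self):
        self._describe_text: Optional[str] = None

    def push_text(self, text: str) -> None:
        self._describe_text = text

    def push_image(self, image: bytes) -> VisionRequest:
        request = VisionRequest(text=self._describe_text, image=image)
        self._describe_text = None  # consume the cached text
        return request


pairer = TextImagePairer()
pairer.push_text("What do you see?")
print(pairer.push_image(b"\x00" * 16).text)  # What do you see?
```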
pipecat/processors/async_generator.py

```diff
@@ -4,6 +4,8 @@
 # SPDX-License-Identifier: BSD 2-Clause License
 #
 
+"""Async generator processor for frame serialization and streaming."""
+
 import asyncio
 from typing import Any, AsyncGenerator
 
@@ -17,12 +19,32 @@ from pipecat.serializers.base_serializer import FrameSerializer
 
 
 class AsyncGeneratorProcessor(FrameProcessor):
+    """A frame processor that serializes frames and provides them via async generator.
+
+    This processor passes frames through unchanged while simultaneously serializing
+    them and making the serialized data available through an async generator interface.
+    Useful for streaming frame data to external consumers while maintaining the
+    normal frame processing pipeline.
+    """
+
     def __init__(self, *, serializer: FrameSerializer, **kwargs):
+        """Initialize the async generator processor.
+
+        Args:
+            serializer: The frame serializer to use for converting frames to data.
+            **kwargs: Additional arguments passed to the parent FrameProcessor.
+        """
         super().__init__(**kwargs)
         self._serializer = serializer
         self._data_queue = asyncio.Queue()
 
     async def process_frame(self, frame: Frame, direction: FrameDirection):
+        """Process frames by passing them through and queuing serialized data.
+
+        Args:
+            frame: The frame to process.
+            direction: The direction of frame flow in the pipeline.
+        """
         await super().process_frame(frame, direction)
 
         await self.push_frame(frame, direction)
@@ -35,6 +57,12 @@ class AsyncGeneratorProcessor(FrameProcessor):
         await self._data_queue.put(data)
 
     async def generator(self) -> AsyncGenerator[Any, None]:
+        """Generate serialized frame data asynchronously.
+
+        Yields:
+            Serialized frame data from the internal queue until a termination
+            signal (None) is received.
+        """
         running = True
         while running:
             data = await self._data_queue.get()
```