PyPI - letta-nightly - Versions diffs - 0.7.8.dev20250502104219__py3-none-any.whl → 0.7.9.dev20250502222710__py3-none-any.whl - Mend

letta-nightly 0.7.8.dev20250502104219__py3-none-any.whl → 0.7.9.dev20250502222710__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

letta/__init__.py +2 -2
letta/agents/helpers.py +58 -1
letta/agents/letta_agent.py +13 -3
letta/agents/letta_agent_batch.py +33 -17
letta/agents/voice_agent.py +1 -2
letta/agents/voice_sleeptime_agent.py +75 -320
letta/functions/function_sets/multi_agent.py +1 -1
letta/functions/function_sets/voice.py +20 -32
letta/functions/helpers.py +7 -7
letta/helpers/datetime_helpers.py +6 -0
letta/helpers/message_helper.py +19 -18
letta/jobs/scheduler.py +233 -49
letta/llm_api/google_ai_client.py +13 -4
letta/llm_api/google_vertex_client.py +5 -1
letta/llm_api/openai.py +10 -2
letta/llm_api/openai_client.py +14 -2
letta/orm/message.py +4 -0
letta/prompts/system/voice_sleeptime.txt +2 -3
letta/schemas/letta_message.py +1 -0
letta/schemas/letta_request.py +8 -1
letta/schemas/letta_response.py +5 -0
letta/schemas/llm_batch_job.py +6 -4
letta/schemas/llm_config.py +9 -0
letta/schemas/message.py +23 -2
letta/schemas/providers.py +3 -1
letta/server/rest_api/app.py +15 -7
letta/server/rest_api/routers/v1/agents.py +3 -0
letta/server/rest_api/routers/v1/messages.py +46 -1
letta/server/rest_api/routers/v1/steps.py +1 -1
letta/server/rest_api/utils.py +25 -6
letta/server/server.py +11 -3
letta/services/llm_batch_manager.py +60 -1
letta/services/message_manager.py +1 -0
letta/services/summarizer/summarizer.py +42 -36
letta/settings.py +1 -0
letta/tracing.py +5 -0
{letta_nightly-0.7.8.dev20250502104219.dist-info → letta_nightly-0.7.9.dev20250502222710.dist-info}/METADATA +2 -2
{letta_nightly-0.7.8.dev20250502104219.dist-info → letta_nightly-0.7.9.dev20250502222710.dist-info}/RECORD +41 -41
{letta_nightly-0.7.8.dev20250502104219.dist-info → letta_nightly-0.7.9.dev20250502222710.dist-info}/LICENSE +0 -0
{letta_nightly-0.7.8.dev20250502104219.dist-info → letta_nightly-0.7.9.dev20250502222710.dist-info}/WHEEL +0 -0
{letta_nightly-0.7.8.dev20250502104219.dist-info → letta_nightly-0.7.9.dev20250502222710.dist-info}/entry_points.txt +0 -0

letta/agents/voice_sleeptime_agent.py CHANGED Viewed

@@ -1,332 +1,138 @@
-import json
-import xml.etree.ElementTree as ET
-from typing import AsyncGenerator, Dict, List, Optional, Tuple, Union
+from typing import AsyncGenerator, List, Tuple, Union
-import openai
-from letta.agents.base_agent import BaseAgent
+from letta.agents.helpers import _create_letta_response, serialize_message_history
+from letta.agents.letta_agent import LettaAgent
+from letta.orm.enums import ToolType
 from letta.schemas.agent import AgentState
 from letta.schemas.block import BlockUpdate
 from letta.schemas.enums import MessageStreamStatus
 from letta.schemas.letta_message import LegacyLettaMessage, LettaMessage
-from letta.schemas.letta_message_content import TextContent
 from letta.schemas.letta_response import LettaResponse
-from letta.schemas.message import Message, MessageCreate, ToolReturn
-from letta.schemas.openai.chat_completion_request import ChatCompletionRequest, Tool, UserMessage
-from letta.schemas.usage import LettaUsageStatistics
+from letta.schemas.message import MessageCreate
+from letta.schemas.tool_rule import ChildToolRule, ContinueToolRule, InitToolRule, TerminalToolRule
 from letta.schemas.user import User
-from letta.server.rest_api.utils import convert_in_context_letta_messages_to_openai, create_input_messages
 from letta.services.agent_manager import AgentManager
 from letta.services.block_manager import BlockManager
 from letta.services.message_manager import MessageManager
-from letta.system import package_function_response
+from letta.services.passage_manager import PassageManager
+from letta.services.summarizer.enums import SummarizationMode
+from letta.services.summarizer.summarizer import Summarizer
+from letta.tracing import trace_method
-# TODO: Move this to the new Letta Agent loop
-class VoiceSleeptimeAgent(BaseAgent):
+class VoiceSleeptimeAgent(LettaAgent):
     """
-    A stateless agent that helps with offline memory computations.
+    A special variant of the LettaAgent that helps with offline memory computations specifically for voice.
     """
     def __init__(
         self,
         agent_id: str,
         convo_agent_state: AgentState,
-        openai_client: openai.AsyncClient,
         message_manager: MessageManager,
         agent_manager: AgentManager,
         block_manager: BlockManager,
+        passage_manager: PassageManager,
         target_block_label: str,
-        message_transcripts: List[str],
         actor: User,
     ):
         super().__init__(
             agent_id=agent_id,
-            openai_client=openai_client,
             message_manager=message_manager,
             agent_manager=agent_manager,
+            block_manager=block_manager,
+            passage_manager=passage_manager,
             actor=actor,
         )
         self.convo_agent_state = convo_agent_state
-        self.block_manager = block_manager
         self.target_block_label = target_block_label
-        self.message_transcripts = message_transcripts
+        self.message_transcripts = []
+        self.summarizer = Summarizer(
+            mode=SummarizationMode.STATIC_MESSAGE_BUFFER,
+            summarizer_agent=None,
+            message_buffer_limit=20,
+            message_buffer_min=10,
+        )
     def update_message_transcript(self, message_transcripts: List[str]):
         self.message_transcripts = message_transcripts
-    async def step(self, input_messages: List[MessageCreate], max_steps: int = 10) -> LettaResponse:
+    async def step(self, input_messages: List[MessageCreate], max_steps: int = 20) -> LettaResponse:
         """
         Process the user's input message, allowing the model to call memory-related tools
         until it decides to stop and provide a final response.
         """
-        agent_state = self.agent_manager.get_agent_by_id(agent_id=self.agent_id, actor=self.actor)
-        in_context_messages = create_input_messages(input_messages=input_messages, agent_id=self.agent_id, actor=self.actor)
-        openai_messages = convert_in_context_letta_messages_to_openai(in_context_messages, exclude_system_messages=True)
-        # 1. Store memories
-        request = self._build_openai_request(openai_messages, agent_state, tools=self._build_store_memory_tool_schemas())
-        chat_completion = await self.openai_client.chat.completions.create(**request.model_dump(exclude_unset=True))
-        assistant_message = chat_completion.choices[0].message
-        # Process tool calls
-        tool_call = assistant_message.tool_calls[0]
-        function_name = tool_call.function.name
-        function_args = json.loads(tool_call.function.arguments)
-        if function_name == "store_memories":
-            print("Called store_memories")
-            print(function_args)
-            chunks = function_args.get("chunks", [])
-            results = [self.store_memory(agent_state=self.convo_agent_state, **chunk_args) for chunk_args in chunks]
-            aggregated_result = next((res for res, _ in results if res is not None), None)
-            aggregated_success = all(success for _, success in results)
-        else:
-            raise ValueError("Error: Unknown tool function '{function_name}'")
+        agent_state = self.agent_manager.get_agent_by_id(self.agent_id, actor=self.actor)
+        # Add tool rules to the agent_state specifically for this type of agent
+        agent_state.tool_rules = [
+            InitToolRule(tool_name="store_memories"),
+            ChildToolRule(tool_name="store_memories", children=["rethink_user_memory"]),
+            ContinueToolRule(tool_name="rethink_user_memory"),
+            TerminalToolRule(tool_name="finish_rethinking_memory"),
+        ]
-        assistant_message = {
-            "role": "assistant",
-            "content": assistant_message.content,
-            "tool_calls": [
-                {
-                    "id": tool_call.id,
-                    "type": "function",
-                    "function": {"name": function_name, "arguments": tool_call.function.arguments},
-                }
-            ],
-        }
-        openai_messages.append(assistant_message)
-        in_context_messages.append(
-            Message.dict_to_message(
-                agent_id=self.agent_id,
-                openai_message_dict=assistant_message,
-                model=agent_state.llm_config.model,
-                name=function_name,
-            )
+        # Summarize
+        current_in_context_messages, new_in_context_messages = await super()._step(
+            agent_state=agent_state, input_messages=input_messages, max_steps=max_steps
         )
-        tool_call_message = {
-            "role": "tool",
-            "tool_call_id": tool_call.id,
-            "content": package_function_response(was_success=aggregated_success, response_string=str(aggregated_result)),
-        }
-        openai_messages.append(tool_call_message)
-        in_context_messages.append(
-            Message.dict_to_message(
-                agent_id=self.agent_id,
-                openai_message_dict=tool_call_message,
-                model=agent_state.llm_config.model,
-                name=function_name,
-                tool_returns=[ToolReturn(status="success" if aggregated_success else "error")],
-            )
+        new_in_context_messages, updated = self.summarizer.summarize(
+            in_context_messages=current_in_context_messages, new_letta_messages=new_in_context_messages
         )
-        # 2. Execute rethink block memory loop
-        human_block_content = self.agent_manager.get_block_with_label(
-            agent_id=self.agent_id, block_label=self.target_block_label, actor=self.actor
+        self.agent_manager.set_in_context_messages(
+            agent_id=self.agent_id, message_ids=[m.id for m in new_in_context_messages], actor=self.actor
         )
-        rethink_command = f"""
-        Here is the current memory block created earlier:
-### CURRENT MEMORY
-{human_block_content}
-### END CURRENT MEMORY
-Please refine this block:
-- Merge in any new facts and remove outdated or contradictory details.
-- Organize related information together (e.g., preferences, background, ongoing goals).
-- Add any light, supportable inferences that deepen understanding—but do not invent unsupported details.
+        return _create_letta_response(new_in_context_messages=new_in_context_messages, use_assistant_message=self.use_assistant_message)
-Use `rethink_user_memory(new_memory)` as many times as you need to iteratively improve the text. When it’s fully polished and complete, call `finish_rethinking_memory()`.
+    @trace_method
+    async def _execute_tool(self, tool_name: str, tool_args: dict, agent_state: AgentState) -> Tuple[str, bool]:
         """
-        rethink_command = UserMessage(content=rethink_command)
-        openai_messages.append(rethink_command.model_dump())
-        for _ in range(max_steps):
-            request = self._build_openai_request(openai_messages, agent_state, tools=self._build_sleeptime_tools())
-            chat_completion = await self.openai_client.chat.completions.create(**request.model_dump(exclude_unset=True))
-            assistant_message = chat_completion.choices[0].message
-            # Process tool calls
-            tool_call = assistant_message.tool_calls[0]
-            function_name = tool_call.function.name
-            function_args = json.loads(tool_call.function.arguments)
-            if function_name == "rethink_user_memory":
-                print("Called rethink_user_memory")
-                print(function_args)
-                result, success = self.rethink_user_memory(agent_state=agent_state, **function_args)
-            elif function_name == "finish_rethinking_memory":
-                print("Called finish_rethinking_memory")
-                result, success = None, True
-                break
-            else:
-                print(f"Error: Unknown tool function '{function_name}'")
-                raise ValueError(f"Error: Unknown tool function '{function_name}'", False)
-            assistant_message = {
-                "role": "assistant",
-                "content": assistant_message.content,
-                "tool_calls": [
-                    {
-                        "id": tool_call.id,
-                        "type": "function",
-                        "function": {"name": function_name, "arguments": tool_call.function.arguments},
-                    }
-                ],
-            }
-            openai_messages.append(assistant_message)
-            in_context_messages.append(
-                Message.dict_to_message(
-                    agent_id=self.agent_id,
-                    openai_message_dict=assistant_message,
-                    model=agent_state.llm_config.model,
-                    name=function_name,
-                )
-            )
-            tool_call_message = {
-                "role": "tool",
-                "tool_call_id": tool_call.id,
-                "content": package_function_response(was_success=success, response_string=str(result)),
-            }
-            openai_messages.append(tool_call_message)
-            in_context_messages.append(
-                Message.dict_to_message(
-                    agent_id=self.agent_id,
-                    openai_message_dict=tool_call_message,
-                    model=agent_state.llm_config.model,
-                    name=function_name,
-                    tool_returns=[ToolReturn(status="success" if success else "error")],
-                )
-            )
-        # Actually save the memory:
-        target_block = agent_state.memory.get_block(self.target_block_label)
-        self.block_manager.update_block(block_id=target_block.id, block_update=BlockUpdate(value=target_block.value), actor=self.actor)
-        self.message_manager.create_many_messages(pydantic_msgs=in_context_messages, actor=self.actor)
-        return LettaResponse(messages=[msg for m in in_context_messages for msg in m.to_letta_messages()], usage=LettaUsageStatistics())
-    def _format_messages_llm_friendly(self):
-        messages = self.message_manager.list_messages_for_agent(agent_id=self.agent_id, actor=self.actor)
-        llm_friendly_messages = [f"{m.role}: {m.content[0].text}" for m in messages if m.content and isinstance(m.content[0], TextContent)]
-        return "\n".join(llm_friendly_messages)
-    def _build_openai_request(self, openai_messages: List[Dict], agent_state: AgentState, tools: List[Tool]) -> ChatCompletionRequest:
-        openai_request = ChatCompletionRequest(
-            model=agent_state.llm_config.model,  # TODO: Separate config for summarizer?
-            messages=openai_messages,
-            tools=tools,
-            tool_choice="required",
-            user=self.actor.id,
-            max_completion_tokens=agent_state.llm_config.max_tokens,
-            temperature=agent_state.llm_config.temperature,
-            stream=False,
-        )
-        return openai_request
-    def _build_store_memory_tool_schemas(self) -> List[Tool]:
-        """
-        Build the schemas for the three memory-related tools.
+        Executes a tool and returns (result, success_flag).
         """
-        tools = [
-            Tool(
-                type="function",
-                function={
-                    "name": "store_memories",
-                    "description": "Archive coherent chunks of dialogue that will be evicted, preserving raw lines and a brief contextual description.",
-                    "parameters": {
-                        "type": "object",
-                        "properties": {
-                            "chunks": {
-                                "type": "array",
-                                "items": {
-                                    "type": "object",
-                                    "properties": {
-                                        "start_index": {"type": "integer", "description": "Index of first line in original history."},
-                                        "end_index": {"type": "integer", "description": "Index of last line in original history."},
-                                        "context": {
-                                            "type": "string",
-                                            "description": "A high-level description providing context for why this chunk matters.",
-                                        },
-                                    },
-                                    "required": ["start_index", "end_index", "context"],
-                                },
-                            }
-                        },
-                        "required": ["chunks"],
-                        "additionalProperties": False,
-                    },
-                },
-            ),
-        ]
-        return tools
+        # Special memory case
+        target_tool = next((x for x in agent_state.tools if x.name == tool_name), None)
+        if not target_tool:
+            return f"Tool not found: {tool_name}", False
-    def _build_sleeptime_tools(self) -> List[Tool]:
-        tools = [
-            Tool(
-                type="function",
-                function={
-                    "name": "rethink_user_memory",
-                    "description": (
-                        "Rewrite memory block for the main agent, new_memory should contain all current "
-                        "information from the block that is not outdated or inconsistent, integrating any "
-                        "new information, resulting in a new memory block that is organized, readable, and "
-                        "comprehensive."
-                    ),
-                    "parameters": {
-                        "type": "object",
-                        "properties": {
-                            "new_memory": {
-                                "type": "string",
-                                "description": (
-                                    "The new memory with information integrated from the memory block. "
-                                    "If there is no new information, then this should be the same as the "
-                                    "content in the source block."
-                                ),
-                            },
-                        },
-                        "required": ["new_memory"],
-                        "additionalProperties": False,
-                    },
-                },
-            ),
-            Tool(
-                type="function",
-                function={
-                    "name": "finish_rethinking_memory",
-                    "description": ("This function is called when the agent is done rethinking the memory."),
-                    "parameters": {
-                        "type": "object",
-                        "properties": {},
-                        "required": [],
-                        "additionalProperties": False,
-                    },
-                },
-            ),
-        ]
-        return tools
+        try:
+            if target_tool.name == "rethink_user_memory" and target_tool.tool_type == ToolType.LETTA_VOICE_SLEEPTIME_CORE:
+                return self.rethink_user_memory(agent_state=agent_state, **tool_args)
+            elif target_tool.name == "finish_rethinking_memory" and target_tool.tool_type == ToolType.LETTA_VOICE_SLEEPTIME_CORE:
+                return "", True
+            elif target_tool.name == "store_memories" and target_tool.tool_type == ToolType.LETTA_VOICE_SLEEPTIME_CORE:
+                chunks = tool_args.get("chunks", [])
+                results = [self.store_memory(agent_state=self.convo_agent_state, **chunk_args) for chunk_args in chunks]
+                aggregated_result = next((res for res, _ in results if res is not None), None)
+                aggregated_success = all(success for _, success in results)
+                return aggregated_result, aggregated_success  # Note that here we store to the convo agent's archival memory
+            else:
+                result = f"Voice sleeptime agent tried invoking invalid tool with type {target_tool.tool_type}: {target_tool}"
+                return result, False
+        except Exception as e:
+            return f"Failed to call tool. Error: {e}", False
-    def rethink_user_memory(self, new_memory: str, agent_state: AgentState) -> Tuple[Optional[str], bool]:
+    def rethink_user_memory(self, new_memory: str, agent_state: AgentState) -> Tuple[str, bool]:
         if agent_state.memory.get_block(self.target_block_label) is None:
             agent_state.memory.create_block(label=self.target_block_label, value=new_memory)
         agent_state.memory.update_block_value(label=self.target_block_label, value=new_memory)
-        return None, True
-    def store_memory(self, start_index: int, end_index: int, context: str, agent_state: AgentState) -> Tuple[Optional[str], bool]:
+        target_block = agent_state.memory.get_block(self.target_block_label)
+        self.block_manager.update_block(block_id=target_block.id, block_update=BlockUpdate(value=target_block.value), actor=self.actor)
+        return "", True
+    def store_memory(self, start_index: int, end_index: int, context: str, agent_state: AgentState) -> Tuple[str, bool]:
         """
         Store a memory.
         """
         try:
             messages = self.message_transcripts[start_index : end_index + 1]
-            memory = self.serialize(messages, context)
+            memory = serialize_message_history(messages, context)
             self.agent_manager.passage_manager.insert_passage(
                 agent_state=agent_state,
                 agent_id=agent_state.id,
@@ -335,63 +141,12 @@ Use `rethink_user_memory(new_memory)` as many times as you need to iteratively i
             )
             self.agent_manager.rebuild_system_prompt(agent_id=agent_state.id, actor=self.actor, force=True)
-            return None, True
+            return "", True
         except Exception as e:
             return f"Failed to store memory given start_index {start_index} and end_index {end_index}: {e}", False
-    def serialize(self, messages: List[str], context: str) -> str:
-        """
-        Produce an XML document like:
-        <memory>
-          <messages>
-            <message>…</message>
-            <message>…</message>
-            …
-          </messages>
-          <context>…</context>
-        </memory>
-        """
-        root = ET.Element("memory")
-        msgs_el = ET.SubElement(root, "messages")
-        for msg in messages:
-            m = ET.SubElement(msgs_el, "message")
-            m.text = msg
-        sum_el = ET.SubElement(root, "context")
-        sum_el.text = context
-        # ET.tostring will escape reserved chars for you
-        return ET.tostring(root, encoding="unicode")
-    def deserialize(self, xml_str: str) -> Tuple[List[str], str]:
-        """
-        Parse the XML back into (messages, context). Raises ValueError if tags are missing.
-        """
-        try:
-            root = ET.fromstring(xml_str)
-        except ET.ParseError as e:
-            raise ValueError(f"Invalid XML: {e}")
-        msgs_el = root.find("messages")
-        if msgs_el is None:
-            raise ValueError("Missing <messages> section")
-        messages = []
-        for m in msgs_el.findall("message"):
-            # .text may be None if empty, so coerce to empty string
-            messages.append(m.text or "")
-        sum_el = root.find("context")
-        if sum_el is None:
-            raise ValueError("Missing <context> section")
-        context = sum_el.text or ""
-        return messages, context
     async def step_stream(
-        self, input_messages: List[MessageCreate], max_steps: int = 10
+        self, input_messages: List[MessageCreate], max_steps: int = 10, use_assistant_message: bool = False
     ) -> AsyncGenerator[Union[LettaMessage, LegacyLettaMessage, MessageStreamStatus], None]:
         """
         This agent is synchronous-only. If called in an async context, raise an error.

letta/functions/function_sets/multi_agent.py CHANGED Viewed

@@ -68,7 +68,7 @@ def send_message_to_agent_async(self: "Agent", message: str, other_agent_id: str
         messages=messages,
         other_agent_id=other_agent_id,
         log_prefix="[send_message_to_agent_async]",
-        use_retries=False,  # or True if you want to use async_send_message_with_retries
+        use_retries=False,  # or True if you want to use _async_send_message_with_retries
     )
     # Immediately return to caller

letta/functions/function_sets/voice.py CHANGED Viewed

@@ -6,15 +6,10 @@ from pydantic import BaseModel, Field
 def rethink_user_memory(agent_state: "AgentState", new_memory: str) -> None:
     """
-    Rewrite memory block for the main agent, new_memory should contain all current
-    information from the block that is not outdated or inconsistent, integrating any
-    new information, resulting in a new memory block that is organized, readable, and
-    comprehensive.
+    Rewrite memory block for the main agent, new_memory should contain all current information from the block that is not outdated or inconsistent, integrating any new information, resulting in a new memory block that is organized, readable, and comprehensive.
     Args:
-        new_memory (str): The new memory with information integrated from the memory block.
-                          If there is no new information, then this should be the same as
-                          the content in the source block.
+        new_memory (str): The new memory with information integrated from the memory block. If there is no new information, then this should be the same as the content in the source block.
     Returns:
         None: None is always returned as this function does not produce a response.
@@ -34,26 +29,27 @@ def finish_rethinking_memory(agent_state: "AgentState") -> None:  # type: ignore
 class MemoryChunk(BaseModel):
-    start_index: int = Field(..., description="Index of the first line in the original conversation history.")
-    end_index: int = Field(..., description="Index of the last line in the original conversation history.")
-    context: str = Field(..., description="A concise, high-level note explaining why this chunk matters.")
+    start_index: int = Field(
+        ...,
+        description="Zero-based index of the first evicted line in this chunk.",
+    )
+    end_index: int = Field(
+        ...,
+        description="Zero-based index of the last evicted line (inclusive).",
+    )
+    context: str = Field(
+        ...,
+        description="1-3 sentence paraphrase capturing key facts/details, user preferences, or goals that this chunk reveals—written for future retrieval.",
+    )
 def store_memories(agent_state: "AgentState", chunks: List[MemoryChunk]) -> None:
     """
-    Archive coherent chunks of dialogue that will be evicted, preserving raw lines
-    and a brief contextual description.
+    Persist dialogue that is about to fall out of the agent’s context window.
     Args:
-        agent_state (AgentState):
-            The agent’s current memory state, exposing both its in-session history
-            and the archival memory API.
         chunks (List[MemoryChunk]):
-            A list of MemoryChunk models, each representing a segment to archive:
-              • start_index (int): Index of the first line in the original history.
-              • end_index   (int): Index of the last line in the original history.
-              • context     (str): A concise, high-level description of why this chunk
-                                 matters and what it contains.
+            Each chunk pinpoints a contiguous block of **evicted** lines and provides a short, forward-looking synopsis (`context`) that will be embedded for future semantic lookup.
     Returns:
         None
@@ -69,20 +65,12 @@ def search_memory(
     end_minutes_ago: Optional[int],
 ) -> Optional[str]:
     """
-    Look in long-term or earlier-conversation memory only when the user asks about
-    something missing from the visible context. The user’s latest utterance is sent
-    automatically as the main query.
+    Look in long-term or earlier-conversation memory only when the user asks about something missing from the visible context. The user’s latest utterance is sent automatically as the main query.
     Args:
-        agent_state (AgentState): The current state of the agent, including its
-            memory stores and context.
-        convo_keyword_queries (Optional[List[str]]): Extra keywords or identifiers
-            (e.g., order ID, place name) to refine the search when the request is vague.
-            Set to None if the user’s utterance is already specific.
-        start_minutes_ago (Optional[int]): Newer bound of the time window for results,
-            specified in minutes ago. Set to None if no lower time bound is needed.
-        end_minutes_ago (Optional[int]): Older bound of the time window for results,
-            specified in minutes ago. Set to None if no upper time bound is needed.
+        convo_keyword_queries (Optional[List[str]]): Extra keywords (e.g., order ID, place name). Use *null* if not appropriate for the latest user message.
+        start_minutes_ago (Optional[int]): Newer bound of the time window for results, specified in minutes ago. Use *null* if no lower time bound is needed.
+        end_minutes_ago (Optional[int]): Older bound of the time window, in minutes ago. Use *null* if no upper bound is needed.
     Returns:
         Optional[str]: A formatted string of matching memory entries, or None if no

letta/functions/helpers.py CHANGED Viewed

@@ -231,7 +231,7 @@ async def async_execute_send_message_to_agent(
     """
     Async helper to:
       1) validate the target agent exists & is in the same org,
-      2) send a message via async_send_message_with_retries.
+      2) send a message via _async_send_message_with_retries.
     """
     server = get_letta_server()
@@ -242,7 +242,7 @@ async def async_execute_send_message_to_agent(
         raise ValueError(f"Target agent {other_agent_id} either does not exist or is not in org " f"({sender_agent.user.organization_id}).")
     # 2. Use your async retry logic
-    return await async_send_message_with_retries(
+    return await _async_send_message_with_retries(
         server=server,
         sender_agent=sender_agent,
         target_agent_id=other_agent_id,
@@ -304,7 +304,7 @@ async def _async_send_message_with_retries(
     timeout: int,
     logging_prefix: Optional[str] = None,
 ) -> str:
-    logging_prefix = logging_prefix or "[async_send_message_with_retries]"
+    logging_prefix = logging_prefix or "[_async_send_message_with_retries]"
     for attempt in range(1, max_retries + 1):
         try:
@@ -363,7 +363,7 @@ def fire_and_forget_send_to_agent(
         messages (List[MessageCreate]): The messages to send.
         other_agent_id (str): The ID of the target agent.
         log_prefix (str): Prefix for logging.
-        use_retries (bool): If True, uses async_send_message_with_retries;
+        use_retries (bool): If True, uses _async_send_message_with_retries;
                             if False, calls server.send_message_to_agent directly.
     """
     server = get_letta_server()
@@ -381,7 +381,7 @@ def fire_and_forget_send_to_agent(
     async def background_task():
         try:
             if use_retries:
-                result = await async_send_message_with_retries(
+                result = await _async_send_message_with_retries(
                     server=server,
                     sender_agent=sender_agent,
                     target_agent_id=other_agent_id,
@@ -434,7 +434,7 @@ async def _send_message_to_agents_matching_tags_async(
     sender_agent: "Agent", server: "SyncServer", messages: List[MessageCreate], matching_agents: List["AgentState"]
 ) -> List[str]:
     async def _send_single(agent_state):
-        return await async_send_message_with_retries(
+        return await _async_send_message_with_retries(
             server=server,
             sender_agent=sender_agent,
             target_agent_id=agent_state.id,
@@ -475,7 +475,7 @@ async def _send_message_to_all_agents_in_group_async(sender_agent: "Agent", mess
     async def _send_single(agent_state):
         async with sem:
-            return await async_send_message_with_retries(
+            return await _async_send_message_with_retries(
                 server=server,
                 sender_agent=sender_agent,
                 target_agent_id=agent_state.id,

letta/helpers/datetime_helpers.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import re
+import time
 from datetime import datetime, timedelta, timezone
 from time import strftime
@@ -77,6 +78,11 @@ def get_utc_time_int() -> int:
     return int(get_utc_time().timestamp())
+def get_utc_timestamp_ns() -> int:
+    """Get the current UTC time in nanoseconds"""
+    return int(time.time_ns())
 def timestamp_to_datetime(timestamp_seconds: int) -> datetime:
     """Convert Unix timestamp in seconds to UTC datetime object"""
     return datetime.fromtimestamp(timestamp_seconds, tz=timezone.utc)

letta-nightly 0.7.8.dev20250502104219__py3-none-any.whl → 0.7.9.dev20250502222710__py3-none-any.whl

letta-nightly 0.7.8.dev20250502104219__py3-none-any.whl → 0.7.9.dev20250502222710__py3-none-any.whl