letta-nightly 0.11.7.dev20251007104119__py3-none-any.whl → 0.12.0.dev20251009104148__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- letta/__init__.py +1 -1
- letta/adapters/letta_llm_adapter.py +1 -0
- letta/adapters/letta_llm_request_adapter.py +0 -1
- letta/adapters/letta_llm_stream_adapter.py +7 -2
- letta/adapters/simple_llm_request_adapter.py +88 -0
- letta/adapters/simple_llm_stream_adapter.py +192 -0
- letta/agents/agent_loop.py +6 -0
- letta/agents/ephemeral_summary_agent.py +2 -1
- letta/agents/helpers.py +142 -6
- letta/agents/letta_agent.py +13 -33
- letta/agents/letta_agent_batch.py +2 -4
- letta/agents/letta_agent_v2.py +87 -77
- letta/agents/letta_agent_v3.py +927 -0
- letta/agents/voice_agent.py +2 -6
- letta/constants.py +8 -4
- letta/database_utils.py +161 -0
- letta/errors.py +40 -0
- letta/functions/function_sets/base.py +84 -4
- letta/functions/function_sets/multi_agent.py +0 -3
- letta/functions/schema_generator.py +113 -71
- letta/groups/dynamic_multi_agent.py +3 -2
- letta/groups/helpers.py +1 -2
- letta/groups/round_robin_multi_agent.py +3 -2
- letta/groups/sleeptime_multi_agent.py +3 -2
- letta/groups/sleeptime_multi_agent_v2.py +1 -1
- letta/groups/sleeptime_multi_agent_v3.py +17 -17
- letta/groups/supervisor_multi_agent.py +84 -80
- letta/helpers/converters.py +3 -0
- letta/helpers/message_helper.py +4 -0
- letta/helpers/tool_rule_solver.py +92 -5
- letta/interfaces/anthropic_streaming_interface.py +409 -0
- letta/interfaces/gemini_streaming_interface.py +296 -0
- letta/interfaces/openai_streaming_interface.py +752 -1
- letta/llm_api/anthropic_client.py +127 -16
- letta/llm_api/bedrock_client.py +4 -2
- letta/llm_api/deepseek_client.py +4 -1
- letta/llm_api/google_vertex_client.py +124 -42
- letta/llm_api/groq_client.py +4 -1
- letta/llm_api/llm_api_tools.py +11 -4
- letta/llm_api/llm_client_base.py +6 -2
- letta/llm_api/openai.py +32 -2
- letta/llm_api/openai_client.py +423 -18
- letta/llm_api/xai_client.py +4 -1
- letta/main.py +9 -5
- letta/memory.py +1 -0
- letta/orm/__init__.py +2 -1
- letta/orm/agent.py +10 -0
- letta/orm/block.py +7 -16
- letta/orm/blocks_agents.py +8 -2
- letta/orm/files_agents.py +2 -0
- letta/orm/job.py +7 -5
- letta/orm/mcp_oauth.py +1 -0
- letta/orm/message.py +21 -6
- letta/orm/organization.py +2 -0
- letta/orm/provider.py +6 -2
- letta/orm/run.py +71 -0
- letta/orm/run_metrics.py +82 -0
- letta/orm/sandbox_config.py +7 -1
- letta/orm/sqlalchemy_base.py +0 -306
- letta/orm/step.py +6 -5
- letta/orm/step_metrics.py +5 -5
- letta/otel/tracing.py +28 -3
- letta/plugins/defaults.py +4 -4
- letta/prompts/system_prompts/__init__.py +2 -0
- letta/prompts/system_prompts/letta_v1.py +25 -0
- letta/schemas/agent.py +3 -2
- letta/schemas/agent_file.py +9 -3
- letta/schemas/block.py +23 -10
- letta/schemas/enums.py +21 -2
- letta/schemas/job.py +17 -4
- letta/schemas/letta_message_content.py +71 -2
- letta/schemas/letta_stop_reason.py +5 -5
- letta/schemas/llm_config.py +53 -3
- letta/schemas/memory.py +1 -1
- letta/schemas/message.py +564 -117
- letta/schemas/openai/responses_request.py +64 -0
- letta/schemas/providers/__init__.py +2 -0
- letta/schemas/providers/anthropic.py +16 -0
- letta/schemas/providers/ollama.py +115 -33
- letta/schemas/providers/openrouter.py +52 -0
- letta/schemas/providers/vllm.py +2 -1
- letta/schemas/run.py +48 -42
- letta/schemas/run_metrics.py +21 -0
- letta/schemas/step.py +2 -2
- letta/schemas/step_metrics.py +1 -1
- letta/schemas/tool.py +15 -107
- letta/schemas/tool_rule.py +88 -5
- letta/serialize_schemas/marshmallow_agent.py +1 -0
- letta/server/db.py +79 -408
- letta/server/rest_api/app.py +61 -10
- letta/server/rest_api/dependencies.py +14 -0
- letta/server/rest_api/redis_stream_manager.py +19 -8
- letta/server/rest_api/routers/v1/agents.py +364 -292
- letta/server/rest_api/routers/v1/blocks.py +14 -20
- letta/server/rest_api/routers/v1/identities.py +45 -110
- letta/server/rest_api/routers/v1/internal_templates.py +21 -0
- letta/server/rest_api/routers/v1/jobs.py +23 -6
- letta/server/rest_api/routers/v1/messages.py +1 -1
- letta/server/rest_api/routers/v1/runs.py +149 -99
- letta/server/rest_api/routers/v1/sandbox_configs.py +10 -19
- letta/server/rest_api/routers/v1/tools.py +281 -594
- letta/server/rest_api/routers/v1/voice.py +1 -1
- letta/server/rest_api/streaming_response.py +29 -29
- letta/server/rest_api/utils.py +122 -64
- letta/server/server.py +160 -887
- letta/services/agent_manager.py +236 -919
- letta/services/agent_serialization_manager.py +16 -0
- letta/services/archive_manager.py +0 -100
- letta/services/block_manager.py +211 -168
- letta/services/context_window_calculator/token_counter.py +1 -1
- letta/services/file_manager.py +1 -1
- letta/services/files_agents_manager.py +24 -33
- letta/services/group_manager.py +0 -142
- letta/services/helpers/agent_manager_helper.py +7 -2
- letta/services/helpers/run_manager_helper.py +69 -0
- letta/services/job_manager.py +96 -411
- letta/services/lettuce/__init__.py +6 -0
- letta/services/lettuce/lettuce_client_base.py +86 -0
- letta/services/mcp_manager.py +38 -6
- letta/services/message_manager.py +165 -362
- letta/services/organization_manager.py +0 -36
- letta/services/passage_manager.py +0 -345
- letta/services/provider_manager.py +0 -80
- letta/services/run_manager.py +364 -0
- letta/services/sandbox_config_manager.py +0 -234
- letta/services/step_manager.py +62 -39
- letta/services/summarizer/summarizer.py +9 -7
- letta/services/telemetry_manager.py +0 -16
- letta/services/tool_executor/builtin_tool_executor.py +35 -0
- letta/services/tool_executor/core_tool_executor.py +397 -2
- letta/services/tool_executor/files_tool_executor.py +3 -3
- letta/services/tool_executor/multi_agent_tool_executor.py +30 -15
- letta/services/tool_executor/tool_execution_manager.py +6 -8
- letta/services/tool_executor/tool_executor_base.py +3 -3
- letta/services/tool_manager.py +85 -339
- letta/services/tool_sandbox/base.py +24 -13
- letta/services/tool_sandbox/e2b_sandbox.py +16 -1
- letta/services/tool_schema_generator.py +123 -0
- letta/services/user_manager.py +0 -99
- letta/settings.py +20 -4
- letta/system.py +5 -1
- {letta_nightly-0.11.7.dev20251007104119.dist-info → letta_nightly-0.12.0.dev20251009104148.dist-info}/METADATA +3 -5
- {letta_nightly-0.11.7.dev20251007104119.dist-info → letta_nightly-0.12.0.dev20251009104148.dist-info}/RECORD +146 -135
- letta/agents/temporal/activities/__init__.py +0 -4
- letta/agents/temporal/activities/example_activity.py +0 -7
- letta/agents/temporal/activities/prepare_messages.py +0 -10
- letta/agents/temporal/temporal_agent_workflow.py +0 -56
- letta/agents/temporal/types.py +0 -25
- {letta_nightly-0.11.7.dev20251007104119.dist-info → letta_nightly-0.12.0.dev20251009104148.dist-info}/WHEEL +0 -0
- {letta_nightly-0.11.7.dev20251007104119.dist-info → letta_nightly-0.12.0.dev20251009104148.dist-info}/entry_points.txt +0 -0
- {letta_nightly-0.11.7.dev20251007104119.dist-info → letta_nightly-0.12.0.dev20251009104148.dist-info}/licenses/LICENSE +0 -0
letta/services/step_manager.py
CHANGED
@@ -8,7 +8,6 @@ from sqlalchemy.orm import Session
 
 from letta.helpers.singleton import singleton
 from letta.orm.errors import NoResultFound
-from letta.orm.job import Job as JobModel
 from letta.orm.message import Message as MessageModel
 from letta.orm.sqlalchemy_base import AccessType
 from letta.orm.step import Step as StepModel
@@ -48,6 +47,7 @@ class StepManager:
         feedback: Optional[Literal["positive", "negative"]] = None,
         has_feedback: Optional[bool] = None,
         project_id: Optional[str] = None,
+        run_id: Optional[str] = None,
     ) -> List[PydanticStep]:
         """List all jobs with optional pagination and status filter."""
         async with db_registry.async_session() as session:
@@ -62,6 +62,8 @@ class StepManager:
                 filter_kwargs["feedback"] = feedback
             if project_id:
                 filter_kwargs["project_id"] = project_id
+            if run_id:
+                filter_kwargs["run_id"] = run_id
             steps = await StepModel.list_async(
                 db_session=session,
                 before=before,
@@ -88,7 +90,7 @@
         context_window_limit: int,
         usage: UsageStatistics,
         provider_id: Optional[str] = None,
-        job_id: Optional[str] = None,
+        run_id: Optional[str] = None,
         step_id: Optional[str] = None,
         project_id: Optional[str] = None,
         stop_reason: Optional[LettaStopReason] = None,
@@ -109,7 +111,7 @@
             "completion_tokens": usage.completion_tokens,
             "prompt_tokens": usage.prompt_tokens,
             "total_tokens": usage.total_tokens,
-            "job_id": job_id,
+            "run_id": run_id,
             "tags": [],
             "tid": None,
             "trace_id": get_trace_id(),  # Get the current trace ID
@@ -123,8 +125,8 @@
         if stop_reason:
             step_data["stop_reason"] = stop_reason.stop_reason
         with db_registry.session() as session:
-            if job_id:
-                self._verify_job_access(session, job_id, actor, access=["write"])
+            if run_id:
+                self._verify_run_access(session, run_id, actor, access=["write"])
             new_step = StepModel(**step_data)
             new_step.create(session)
             return new_step.to_pydantic()
@@ -142,13 +144,14 @@
         context_window_limit: int,
         usage: UsageStatistics,
         provider_id: Optional[str] = None,
-        job_id: Optional[str] = None,
+        run_id: Optional[str] = None,
         step_id: Optional[str] = None,
         project_id: Optional[str] = None,
         stop_reason: Optional[LettaStopReason] = None,
         status: Optional[StepStatus] = None,
         error_type: Optional[str] = None,
         error_data: Optional[Dict] = None,
+        allow_partial: Optional[bool] = False,
     ) -> PydanticStep:
         step_data = {
             "origin": None,
@@ -163,7 +166,7 @@
             "completion_tokens": usage.completion_tokens,
             "prompt_tokens": usage.prompt_tokens,
             "total_tokens": usage.total_tokens,
-            "job_id": job_id,
+            "run_id": run_id,
             "tags": [],
             "tid": None,
             "trace_id": get_trace_id(),  # Get the current trace ID
@@ -176,7 +179,15 @@
             step_data["id"] = step_id
         if stop_reason:
             step_data["stop_reason"] = stop_reason.stop_reason
+
         async with db_registry.async_session() as session:
+            if allow_partial:
+                try:
+                    new_step = await StepModel.read_async(db_session=session, identifier=step_id, actor=actor)
+                    return new_step.to_pydantic()
+                except NoResultFound:
+                    pass
+
             new_step = StepModel(**step_data)
             await new_step.create_async(session, no_commit=True, no_refresh=True)
             pydantic_step = new_step.to_pydantic()
@@ -420,10 +431,11 @@
         tool_execution_ns: Optional[int] = None,
         step_ns: Optional[int] = None,
         agent_id: Optional[str] = None,
-        job_id: Optional[str] = None,
+        run_id: Optional[str] = None,
         project_id: Optional[str] = None,
         template_id: Optional[str] = None,
         base_template_id: Optional[str] = None,
+        allow_partial: Optional[bool] = False,
     ) -> PydanticStepMetrics:
         """Record performance metrics for a step.
 
@@ -434,7 +446,7 @@
             tool_execution_ns: Time spent on tool execution in nanoseconds
             step_ns: Total time for the step in nanoseconds
             agent_id: The ID of the agent
-            job_id: The ID of the job
+            run_id: The ID of the run
             project_id: The ID of the project
             template_id: The ID of the template
             base_template_id: The ID of the base template
@@ -452,11 +464,18 @@
             if step.organization_id != actor.organization_id:
                 raise Exception("Unauthorized")
 
+            if allow_partial:
+                try:
+                    metrics = await StepMetricsModel.read_async(db_session=session, identifier=step_id, actor=actor)
+                    return metrics.to_pydantic()
+                except NoResultFound:
+                    pass
+
             metrics_data = {
                 "id": step_id,
                 "organization_id": actor.organization_id,
                 "agent_id": agent_id or step.agent_id,
-                "job_id": job_id,
+                "run_id": run_id,
                 "project_id": project_id or step.project_id,
                 "llm_request_ns": llm_request_ns,
                 "tool_execution_ns": tool_execution_ns,
@@ -469,62 +488,66 @@
             await metrics.create_async(session)
             return metrics.to_pydantic()
 
-    def _verify_job_access(
+    def _verify_run_access(
         self,
         session: Session,
-        job_id: str,
+        run_id: str,
         actor: PydanticUser,
         access: List[Literal["read", "write", "delete"]] = ["read"],
-    ) -> JobModel:
+    ):
         """
-        Verify that a job exists and the user has the required access.
+        Verify that a run exists and the user has the required access.
 
         Args:
             session: The database session
-            job_id: The ID of the job to verify
+            run_id: The ID of the run to verify
             actor: The user making the request
 
         Returns:
-            The job if it exists and the user has access
+            The run if it exists and the user has access
 
         Raises:
-            NoResultFound: If the job does not exist or user does not have access
+            NoResultFound: If the run does not exist or user does not have access
         """
-        job_query = select(JobModel).where(JobModel.id == job_id)
-        job_query = JobModel.apply_access_predicate(job_query, actor, access, AccessType.USER)
-        job = session.execute(job_query).scalar_one_or_none()
-        if not job:
-            raise NoResultFound(f"Job with id {job_id} does not exist or user does not have access")
-        return job
+        from letta.orm.run import Run as RunModel
+
+        run_query = select(RunModel).where(RunModel.id == run_id)
+        run_query = RunModel.apply_access_predicate(run_query, actor, access, AccessType.USER)
+        run = session.execute(run_query).scalar_one_or_none()
+        if not run:
+            raise NoResultFound(f"Run with id {run_id} does not exist or user does not have access")
+        return run
 
     @staticmethod
-    async def _verify_job_access_async(
+    async def _verify_run_access_async(
         session: AsyncSession,
-        job_id: str,
+        run_id: str,
         actor: PydanticUser,
         access: List[Literal["read", "write", "delete"]] = ["read"],
-    ) -> JobModel:
+    ):
         """
-        Verify that a job exists and the user has the required access asynchronously.
+        Verify that a run exists and the user has the required access asynchronously.
 
         Args:
             session: The async database session
-            job_id: The ID of the job to verify
+            run_id: The ID of the run to verify
            actor: The user making the request
 
         Returns:
-            The job if it exists and the user has access
+            The run if it exists and the user has access
 
         Raises:
-            NoResultFound: If the job does not exist or user does not have access
+            NoResultFound: If the run does not exist or user does not have access
         """
-        job_query = select(JobModel).where(JobModel.id == job_id)
-        job_query = JobModel.apply_access_predicate(job_query, actor, access, AccessType.USER)
-        result = await session.execute(job_query)
-        job = result.scalar_one_or_none()
-        if not job:
-            raise NoResultFound(f"Job with id {job_id} does not exist or user does not have access")
-        return job
+        from letta.orm.run import Run as RunModel
+
+        run_query = select(RunModel).where(RunModel.id == run_id)
+        run_query = RunModel.apply_access_predicate(run_query, actor, access, AccessType.USER)
+        result = await session.execute(run_query)
+        run = result.scalar_one_or_none()
+        if not run:
+            raise NoResultFound(f"Run with id {run_id} does not exist or user does not have access")
+        return run
 
 
 # noinspection PyTypeChecker
@@ -549,7 +572,7 @@ class NoopStepManager(StepManager):
         context_window_limit: int,
         usage: UsageStatistics,
         provider_id: Optional[str] = None,
-        job_id: Optional[str] = None,
+        run_id: Optional[str] = None,
         step_id: Optional[str] = None,
         project_id: Optional[str] = None,
         stop_reason: Optional[LettaStopReason] = None,
@@ -572,7 +595,7 @@ class NoopStepManager(StepManager):
         context_window_limit: int,
         usage: UsageStatistics,
         provider_id: Optional[str] = None,
-        job_id: Optional[str] = None,
+        run_id: Optional[str] = None,
         step_id: Optional[str] = None,
         project_id: Optional[str] = None,
         stop_reason: Optional[LettaStopReason] = None,
letta/services/summarizer/summarizer.py
CHANGED
@@ -10,7 +10,7 @@ from letta.llm_api.llm_client import LLMClient
 from letta.log import get_logger
 from letta.otel.tracing import trace_method
 from letta.prompts import gpt_summarize
-from letta.schemas.enums import MessageRole
+from letta.schemas.enums import AgentType, MessageRole
 from letta.schemas.letta_message_content import TextContent
 from letta.schemas.llm_config import LLMConfig
 from letta.schemas.message import Message, MessageCreate
@@ -189,6 +189,7 @@ class Summarizer:
             # We already packed, don't pack again
             wrap_user_message=False,
             wrap_system_message=False,
+            run_id=None,  # TODO: add this
         )[0]
 
         # Create the message in the DB
@@ -383,17 +384,18 @@ async def simple_summary(messages: List[Message], llm_config: LLMConfig, actor:
         {"role": "user", "content": summary_transcript},
     ]
     input_messages_obj = [simple_message_wrapper(msg) for msg in input_messages]
-
+    # Build a local LLMConfig for v1-style summarization which uses native content and must not
+    # include inner thoughts in kwargs to avoid conflicts in Anthropic formatting
+    summarizer_llm_config = LLMConfig(**llm_config.model_dump())
+    summarizer_llm_config.put_inner_thoughts_in_kwargs = False
 
-
-    # I'm leaving it commented it out for now for safety but is fine assuming the var here is a copy not a reference
-    # llm_config.put_inner_thoughts_in_kwargs = False
+    request_data = llm_client.build_request_data(AgentType.letta_v1_agent, input_messages_obj, summarizer_llm_config, tools=[])
     try:
-        response_data = await llm_client.request_async(request_data, llm_config)
+        response_data = await llm_client.request_async(request_data, summarizer_llm_config)
     except Exception as e:
         # handle LLM error (likely a context window exceeded error)
         raise llm_client.handle_llm_error(e)
-    response = llm_client.convert_response_to_chat_completion(response_data, input_messages_obj, llm_config)
+    response = llm_client.convert_response_to_chat_completion(response_data, input_messages_obj, summarizer_llm_config)
     if response.choices[0].message.content is None:
         logger.warning("No content returned from summarizer")
         # TODO raise an error error instead?
letta/services/telemetry_manager.py
CHANGED
@@ -39,22 +39,6 @@ class TelemetryManager:
             await session.commit()
             return pydantic_provider_trace
 
-    @enforce_types
-    @trace_method
-    def create_provider_trace(self, actor: PydanticUser, provider_trace_create: ProviderTraceCreate) -> PydanticProviderTrace:
-        with db_registry.session() as session:
-            provider_trace = ProviderTraceModel(**provider_trace_create.model_dump())
-            provider_trace.organization_id = actor.organization_id
-            if provider_trace_create.request_json:
-                request_json_str = json_dumps(provider_trace_create.request_json)
-                provider_trace.request_json = json_loads(request_json_str)
-
-            if provider_trace_create.response_json:
-                response_json_str = json_dumps(provider_trace_create.response_json)
-                provider_trace.response_json = json_loads(response_json_str)
-            provider_trace.create(session, actor=actor)
-            return provider_trace.to_pydantic()
-
 
 @singleton
 class NoopTelemetryManager(TelemetryManager):
letta/services/tool_executor/builtin_tool_executor.py
CHANGED
@@ -209,6 +209,41 @@ class LettaBuiltinToolExecutor(ToolExecutor):
         from readability import Document
         from trafilatura import extract, fetch_url
 
+        # Try exa first
+        try:
+            from exa_py import Exa
+
+            agent_state_tool_env_vars = agent_state.get_agent_env_vars_as_dict()
+            exa_api_key = agent_state_tool_env_vars.get("EXA_API_KEY") or tool_settings.exa_api_key
+            if exa_api_key:
+                logger.info(f"[DEBUG] Starting Exa fetch content for url: '{url}'")
+                exa = Exa(api_key=exa_api_key)
+
+                results = await asyncio.to_thread(
+                    lambda: exa.get_contents(
+                        [url],
+                        text=True,
+                    ).results
+                )
+
+                if len(results) > 0:
+                    result = results[0]
+                    return json.dumps(
+                        {
+                            "title": result.title,
+                            "published_date": result.published_date,
+                            "author": result.author,
+                            "text": result.text,
+                        }
+                    )
+                else:
+                    logger.info(f"[DEBUG] Exa did not return content for '{url}', falling back to local fetch.")
+            else:
+                logger.info("[DEBUG] No Exa key available, falling back to local fetch.")
+        except ImportError:
+            logger.info("[DEBUG] Exa pip package unavailable, falling back to local fetch.")
+            pass
+
         try:
             # single thread pool call for the entire trafilatura pipeline
             def trafilatura_pipeline():