letta-nightly 0.11.0.dev20250807104511__py3-none-any.whl → 0.11.0.dev20250808104456__py3-none-any.whl
This diff compares the contents of two publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the packages as they appear in their public registry.
- letta/agent.py +2 -1
- letta/agents/letta_agent.py +215 -143
- letta/constants.py +4 -1
- letta/embeddings.py +6 -5
- letta/functions/function_sets/base.py +2 -2
- letta/functions/function_sets/files.py +22 -9
- letta/interfaces/anthropic_streaming_interface.py +291 -265
- letta/interfaces/openai_streaming_interface.py +270 -250
- letta/llm_api/anthropic.py +3 -10
- letta/llm_api/openai_client.py +6 -1
- letta/orm/__init__.py +1 -0
- letta/orm/step.py +14 -0
- letta/orm/step_metrics.py +71 -0
- letta/schemas/enums.py +9 -0
- letta/schemas/llm_config.py +8 -6
- letta/schemas/providers/lmstudio.py +2 -2
- letta/schemas/providers/ollama.py +42 -54
- letta/schemas/providers/openai.py +1 -1
- letta/schemas/step.py +6 -0
- letta/schemas/step_metrics.py +23 -0
- letta/schemas/tool_rule.py +10 -29
- letta/services/step_manager.py +179 -1
- letta/services/tool_executor/builtin_tool_executor.py +4 -1
- letta/services/tool_executor/core_tool_executor.py +2 -10
- letta/services/tool_executor/files_tool_executor.py +89 -40
- {letta_nightly-0.11.0.dev20250807104511.dist-info → letta_nightly-0.11.0.dev20250808104456.dist-info}/METADATA +1 -1
- {letta_nightly-0.11.0.dev20250807104511.dist-info → letta_nightly-0.11.0.dev20250808104456.dist-info}/RECORD +30 -28
- {letta_nightly-0.11.0.dev20250807104511.dist-info → letta_nightly-0.11.0.dev20250808104456.dist-info}/LICENSE +0 -0
- {letta_nightly-0.11.0.dev20250807104511.dist-info → letta_nightly-0.11.0.dev20250808104456.dist-info}/WHEEL +0 -0
- {letta_nightly-0.11.0.dev20250807104511.dist-info → letta_nightly-0.11.0.dev20250808104456.dist-info}/entry_points.txt +0 -0
letta/agent.py
CHANGED
@@ -45,7 +45,7 @@ from letta.otel.tracing import log_event, trace_method
 from letta.schemas.agent import AgentState, AgentStepResponse, UpdateAgent, get_prompt_template_for_agent_type
 from letta.schemas.block import BlockUpdate
 from letta.schemas.embedding_config import EmbeddingConfig
-from letta.schemas.enums import MessageRole, ProviderType, ToolType
+from letta.schemas.enums import MessageRole, ProviderType, StepStatus, ToolType
 from letta.schemas.letta_message_content import ImageContent, TextContent
 from letta.schemas.memory import ContextWindowOverview, Memory
 from letta.schemas.message import Message, MessageCreate, ToolReturn
@@ -991,6 +991,7 @@ class Agent(BaseAgent):
             job_id=job_id,
             step_id=step_id,
             project_id=self.agent_state.project_id,
+            status=StepStatus.SUCCESS,  # Set to SUCCESS since we're logging after successful completion
         )
         for message in all_new_messages:
             message.step_id = step.id
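The `status` argument added above comes from a new `StepStatus` enum in `letta/schemas/enums.py` (the +9-line change in the file list); the enum body itself is not shown in this diff. A minimal sketch consistent with the statuses this diff exercises (`PENDING`, `SUCCESS`, and the error path behind `update_step_error_async`) might look like:

```python
# Hypothetical sketch of StepStatus; the real definition lives in
# letta/schemas/enums.py and is not displayed in this diff.
from enum import Enum


class StepStatus(str, Enum):
    PENDING = "pending"  # step row created before the LLM call finishes
    SUCCESS = "success"  # step completed and usage statistics were recorded
    ERROR = "error"      # step failed; details stored via update_step_error_async
```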
letta/agents/letta_agent.py
CHANGED
@@ -34,7 +34,7 @@ from letta.otel.context import get_ctx_attributes
 from letta.otel.metric_registry import MetricRegistry
 from letta.otel.tracing import log_event, trace_method, tracer
 from letta.schemas.agent import AgentState, UpdateAgent
-from letta.schemas.enums import JobStatus, MessageRole, ProviderType, ToolType
+from letta.schemas.enums import JobStatus, MessageRole, ProviderType, StepStatus, ToolType
 from letta.schemas.letta_message import MessageType
 from letta.schemas.letta_message_content import OmittedReasoningContent, ReasoningContent, RedactedReasoningContent, TextContent
 from letta.schemas.letta_response import LettaResponse
@@ -241,6 +241,26 @@ class LettaAgent(BaseAgent):
 
             step_progression = StepProgression.START
             should_continue = False
+
+            # Create step early with PENDING status
+            logged_step = await self.step_manager.log_step_async(
+                actor=self.actor,
+                agent_id=agent_state.id,
+                provider_name=agent_state.llm_config.model_endpoint_type,
+                provider_category=agent_state.llm_config.provider_category or "base",
+                model=agent_state.llm_config.model,
+                model_endpoint=agent_state.llm_config.model_endpoint,
+                context_window_limit=agent_state.llm_config.context_window,
+                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
+                provider_id=None,
+                job_id=self.current_run_id if self.current_run_id else None,
+                step_id=step_id,
+                project_id=agent_state.project_id,
+                status=StepStatus.PENDING,
+            )
+            # Only use step_id in messages if step was actually created
+            effective_step_id = step_id if logged_step else None
+
             try:
                 request_data, response_data, current_in_context_messages, new_in_context_messages, valid_tool_names = (
                     await self._build_and_request_from_llm(
@@ -295,13 +315,17 @@ class LettaAgent(BaseAgent):
                     tool_rules_solver,
                     response.usage,
                     reasoning_content=reasoning,
-                    step_id=
+                    step_id=effective_step_id,
                     initial_messages=initial_messages,
                     agent_step_span=agent_step_span,
                     is_final_step=(i == max_steps - 1),
                 )
                 step_progression = StepProgression.STEP_LOGGED
 
+                # Update step with actual usage now that we have it (if step was created)
+                if logged_step:
+                    await self.step_manager.update_step_success_async(self.actor, step_id, response.usage, stop_reason)
+
                 # TODO (cliandy): handle message contexts with larger refactor and dedupe logic
                 new_message_idx = len(initial_messages) if initial_messages else 0
                 self.response_messages.extend(persisted_messages[new_message_idx:])
@@ -321,7 +345,7 @@ class LettaAgent(BaseAgent):
                     provider_trace_create=ProviderTraceCreate(
                         request_json=request_data,
                         response_json=response_data,
-                        step_id=step_id,
+                        step_id=step_id,  # Use original step_id for telemetry
                         organization_id=self.actor.organization_id,
                     ),
                 )
@@ -358,54 +382,57 @@ class LettaAgent(BaseAgent):
 
             # Update step if it needs to be updated
             finally:
-                if
-
-
-
-
-
-
-
-
-
+                if step_progression == StepProgression.FINISHED and should_continue:
+                    continue
+
+                self.logger.debug("Running cleanup for agent loop run: %s", self.current_run_id)
+                self.logger.info("Running final update. Step Progression: %s", step_progression)
+                try:
+                    if step_progression == StepProgression.FINISHED and not should_continue:
+                        # Successfully completed - update with final usage and stop reason
+                        if stop_reason is None:
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.end_turn.value)
+                        # Note: step already updated with success status after _handle_ai_response
+                        if logged_step:
                             await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-
+                        break
 
-
-
+                    # Handle error cases
+                    if step_progression < StepProgression.STEP_LOGGED:
+                        # Error occurred before step was fully logged
+                        import traceback
+
+                        if logged_step:
+                            await self.step_manager.update_step_error_async(
                                 actor=self.actor,
-
-
-
-
-                                model_endpoint=agent_state.llm_config.model_endpoint,
-                                context_window_limit=agent_state.llm_config.context_window,
-                                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
-                                provider_id=None,
-                                job_id=self.current_run_id if self.current_run_id else None,
-                                step_id=step_id,
-                                project_id=agent_state.project_id,
+                                step_id=step_id,  # Use original step_id for telemetry
+                                error_type=type(e).__name__ if "e" in locals() else "Unknown",
+                                error_message=str(e) if "e" in locals() else "Unknown error",
+                                error_traceback=traceback.format_exc(),
                                 stop_reason=stop_reason,
                             )
-
-
-
-
-
-
-
-
-
-
-
+
+                    if step_progression <= StepProgression.RESPONSE_RECEIVED:
+                        # TODO (cliandy): persist response if we get it back
+                        if settings.track_errored_messages:
+                            for message in initial_messages:
+                                message.is_err = True
+                                message.step_id = effective_step_id
+                            await self.message_manager.create_many_messages_async(initial_messages, actor=self.actor)
+                    elif step_progression <= StepProgression.LOGGED_TRACE:
+                        if stop_reason is None:
+                            self.logger.error("Error in step after logging step")
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.error.value)
+                        if logged_step:
                             await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-
-
+                    else:
+                        self.logger.error("Invalid StepProgression value")
 
+                    if settings.track_stop_reason:
                         await self._log_request(request_start_timestamp_ns, request_span)
 
-
-
+                except Exception as e:
+                    self.logger.error("Failed to update step: %s", e)
 
             if not should_continue:
                 break
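The cleanup above compares progression states with `<` and `<=` (for example `step_progression < StepProgression.STEP_LOGGED`), which only works when `StepProgression` is an ordered enum. A sketch of the pattern, assuming an `IntEnum` whose member names are taken from this diff (the actual values and full member list may differ):

```python
# Sketch only: the stage names appear in this diff, but the ordering and
# numeric values of letta's real StepProgression enum are assumptions here.
from enum import IntEnum


class StepProgression(IntEnum):
    START = 0
    STREAM_RECEIVED = 1
    RESPONSE_RECEIVED = 2
    STEP_LOGGED = 3
    LOGGED_TRACE = 4
    FINISHED = 5


progress = StepProgression.RESPONSE_RECEIVED
if progress < StepProgression.STEP_LOGGED:
    print("failed before the step row was finalized -> record the error on the step")
elif progress <= StepProgression.LOGGED_TRACE:
    print("step exists but the run stopped late -> persist a stop reason instead")
```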
@@ -484,6 +511,25 @@ class LettaAgent(BaseAgent):
             step_progression = StepProgression.START
             should_continue = False
 
+            # Create step early with PENDING status
+            logged_step = await self.step_manager.log_step_async(
+                actor=self.actor,
+                agent_id=agent_state.id,
+                provider_name=agent_state.llm_config.model_endpoint_type,
+                provider_category=agent_state.llm_config.provider_category or "base",
+                model=agent_state.llm_config.model,
+                model_endpoint=agent_state.llm_config.model_endpoint,
+                context_window_limit=agent_state.llm_config.context_window,
+                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
+                provider_id=None,
+                job_id=run_id if run_id else self.current_run_id,
+                step_id=step_id,
+                project_id=agent_state.project_id,
+                status=StepStatus.PENDING,
+            )
+            # Only use step_id in messages if step was actually created
+            effective_step_id = step_id if logged_step else None
+
             try:
                 request_data, response_data, current_in_context_messages, new_in_context_messages, valid_tool_names = (
                     await self._build_and_request_from_llm(
@@ -533,7 +579,7 @@ class LettaAgent(BaseAgent):
                     tool_rules_solver,
                     response.usage,
                     reasoning_content=reasoning,
-                    step_id=
+                    step_id=effective_step_id,
                     initial_messages=initial_messages,
                     agent_step_span=agent_step_span,
                     is_final_step=(i == max_steps - 1),
@@ -541,6 +587,10 @@ class LettaAgent(BaseAgent):
                 )
                 step_progression = StepProgression.STEP_LOGGED
 
+                # Update step with actual usage now that we have it (if step was created)
+                if logged_step:
+                    await self.step_manager.update_step_success_async(self.actor, step_id, response.usage, stop_reason)
+
                 new_message_idx = len(initial_messages) if initial_messages else 0
                 self.response_messages.extend(persisted_messages[new_message_idx:])
                 new_in_context_messages.extend(persisted_messages[new_message_idx:])
@@ -560,7 +610,7 @@ class LettaAgent(BaseAgent):
                         provider_trace_create=ProviderTraceCreate(
                             request_json=request_data,
                             response_json=response_data,
-                            step_id=step_id,
+                            step_id=step_id,  # Use original step_id for telemetry
                            organization_id=self.actor.organization_id,
                        ),
                    )
@@ -584,54 +634,56 @@ class LettaAgent(BaseAgent):
 
             # Update step if it needs to be updated
             finally:
-                if
-
-                    continue
-
-                self.logger.debug("Running cleanup for agent loop run: %s", self.current_run_id)
-                self.logger.info("Running final update. Step Progression: %s", step_progression)
-                try:
-                    if step_progression == StepProgression.FINISHED and not should_continue:
-                        if stop_reason is None:
-                            stop_reason = LettaStopReason(stop_reason=StopReasonType.end_turn.value)
-                        await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-                        break
+                if step_progression == StepProgression.FINISHED and should_continue:
+                    continue
 
-
-
+                self.logger.debug("Running cleanup for agent loop run: %s", self.current_run_id)
+                self.logger.info("Running final update. Step Progression: %s", step_progression)
+                try:
+                    if step_progression == StepProgression.FINISHED and not should_continue:
+                        # Successfully completed - update with final usage and stop reason
+                        if stop_reason is None:
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.end_turn.value)
+                        if logged_step:
+                            await self.step_manager.update_step_success_async(self.actor, step_id, usage, stop_reason)
+                        break
+
+                    # Handle error cases
+                    if step_progression < StepProgression.STEP_LOGGED:
+                        # Error occurred before step was fully logged
+                        import traceback
+
+                        if logged_step:
+                            await self.step_manager.update_step_error_async(
                                 actor=self.actor,
-
-
-
-
-                                model_endpoint=agent_state.llm_config.model_endpoint,
-                                context_window_limit=agent_state.llm_config.context_window,
-                                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
-                                provider_id=None,
-                                job_id=self.current_run_id if self.current_run_id else None,
-                                step_id=step_id,
-                                project_id=agent_state.project_id,
+                                step_id=step_id,  # Use original step_id for telemetry
+                                error_type=type(e).__name__ if "e" in locals() else "Unknown",
+                                error_message=str(e) if "e" in locals() else "Unknown error",
+                                error_traceback=traceback.format_exc(),
                                 stop_reason=stop_reason,
                             )
-
-
-
-
-
-
-
-
-
-
-
+
+                    if step_progression <= StepProgression.RESPONSE_RECEIVED:
+                        # TODO (cliandy): persist response if we get it back
+                        if settings.track_errored_messages:
+                            for message in initial_messages:
+                                message.is_err = True
+                                message.step_id = effective_step_id
+                            await self.message_manager.create_many_messages_async(initial_messages, actor=self.actor)
+                    elif step_progression <= StepProgression.LOGGED_TRACE:
+                        if stop_reason is None:
+                            self.logger.error("Error in step after logging step")
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.error.value)
+                        if logged_step:
                             await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-
-
+                    else:
+                        self.logger.error("Invalid StepProgression value")
 
+                    if settings.track_stop_reason:
                         await self._log_request(request_start_timestamp_ns, request_span)
 
-
-
+                except Exception as e:
+                    self.logger.error("Failed to update step: %s", e)
 
             if not should_continue:
                 break
@@ -717,6 +769,26 @@ class LettaAgent(BaseAgent):
 
             step_progression = StepProgression.START
             should_continue = False
+
+            # Create step early with PENDING status
+            logged_step = await self.step_manager.log_step_async(
+                actor=self.actor,
+                agent_id=agent_state.id,
+                provider_name=agent_state.llm_config.model_endpoint_type,
+                provider_category=agent_state.llm_config.provider_category or "base",
+                model=agent_state.llm_config.model,
+                model_endpoint=agent_state.llm_config.model_endpoint,
+                context_window_limit=agent_state.llm_config.context_window,
+                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
+                provider_id=None,
+                job_id=self.current_run_id if self.current_run_id else None,
+                step_id=step_id,
+                project_id=agent_state.project_id,
+                status=StepStatus.PENDING,
+            )
+            # Only use step_id in messages if step was actually created
+            effective_step_id = step_id if logged_step else None
+
             try:
                 (
                     request_data,
@@ -827,13 +899,26 @@ class LettaAgent(BaseAgent):
                     ),
                     reasoning_content=reasoning_content,
                     pre_computed_assistant_message_id=interface.letta_message_id,
-                    step_id=
+                    step_id=effective_step_id,
                     initial_messages=initial_messages,
                     agent_step_span=agent_step_span,
                     is_final_step=(i == max_steps - 1),
                 )
                 step_progression = StepProgression.STEP_LOGGED
 
+                # Update step with actual usage now that we have it (if step was created)
+                if logged_step:
+                    await self.step_manager.update_step_success_async(
+                        self.actor,
+                        step_id,
+                        UsageStatistics(
+                            completion_tokens=usage.completion_tokens,
+                            prompt_tokens=usage.prompt_tokens,
+                            total_tokens=usage.total_tokens,
+                        ),
+                        stop_reason,
+                    )
+
                 new_message_idx = len(initial_messages) if initial_messages else 0
                 self.response_messages.extend(persisted_messages[new_message_idx:])
                 new_in_context_messages.extend(persisted_messages[new_message_idx:])
@@ -872,7 +957,7 @@ class LettaAgent(BaseAgent):
                                 "output_tokens": usage.completion_tokens,
                             },
                         },
-                        step_id=step_id,
+                        step_id=step_id,  # Use original step_id for telemetry
                        organization_id=self.actor.organization_id,
                    ),
                )
@@ -907,54 +992,57 @@ class LettaAgent(BaseAgent):
 
             # Update step if it needs to be updated
             finally:
-                if
-
-
-
-
-
-
-
-
-
+                if step_progression == StepProgression.FINISHED and should_continue:
+                    continue
+
+                self.logger.debug("Running cleanup for agent loop run: %s", self.current_run_id)
+                self.logger.info("Running final update. Step Progression: %s", step_progression)
+                try:
+                    if step_progression == StepProgression.FINISHED and not should_continue:
+                        # Successfully completed - update with final usage and stop reason
+                        if stop_reason is None:
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.end_turn.value)
+                        # Note: step already updated with success status after _handle_ai_response
+                        if logged_step:
                             await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-
+                        break
+
+                    # Handle error cases
+                    if step_progression < StepProgression.STEP_LOGGED:
+                        # Error occurred before step was fully logged
+                        import traceback
 
-                    if
-                        await self.step_manager.
+                        if logged_step:
+                            await self.step_manager.update_step_error_async(
                                 actor=self.actor,
-
-
-
-
-                                model_endpoint=agent_state.llm_config.model_endpoint,
-                                context_window_limit=agent_state.llm_config.context_window,
-                                usage=UsageStatistics(completion_tokens=0, prompt_tokens=0, total_tokens=0),
-                                provider_id=None,
-                                job_id=self.current_run_id if self.current_run_id else None,
-                                step_id=step_id,
-                                project_id=agent_state.project_id,
+                                step_id=step_id,  # Use original step_id for telemetry
+                                error_type=type(e).__name__ if "e" in locals() else "Unknown",
+                                error_message=str(e) if "e" in locals() else "Unknown error",
+                                error_traceback=traceback.format_exc(),
                                 stop_reason=stop_reason,
                             )
-
-
-
-
-
-
-
-
-
-
+
+                    if step_progression <= StepProgression.STREAM_RECEIVED:
+                        if first_chunk and settings.track_errored_messages:
+                            for message in initial_messages:
+                                message.is_err = True
+                                message.step_id = effective_step_id
+                            await self.message_manager.create_many_messages_async(initial_messages, actor=self.actor)
+                    elif step_progression <= StepProgression.LOGGED_TRACE:
+                        if stop_reason is None:
+                            self.logger.error("Error in step after logging step")
+                            stop_reason = LettaStopReason(stop_reason=StopReasonType.error.value)
+                        if logged_step:
                             await self.step_manager.update_step_stop_reason(self.actor, step_id, stop_reason.stop_reason)
-
-
+                    else:
+                        self.logger.error("Invalid StepProgression value")
 
-
+                    # Do tracking for failure cases. Can consolidate with success conditions later.
+                    if settings.track_stop_reason:
                         await self._log_request(request_start_timestamp_ns, request_span)
 
-
-
+                except Exception as e:
+                    self.logger.error("Failed to update step: %s", e)
 
             if not should_continue:
                 break
@@ -1315,23 +1403,7 @@ class LettaAgent(BaseAgent):
             is_final_step=is_final_step,
         )
 
-        # 5.
-        logged_step = await self.step_manager.log_step_async(
-            actor=self.actor,
-            agent_id=agent_state.id,
-            provider_name=agent_state.llm_config.model_endpoint_type,
-            provider_category=agent_state.llm_config.provider_category or "base",
-            model=agent_state.llm_config.model,
-            model_endpoint=agent_state.llm_config.model_endpoint,
-            context_window_limit=agent_state.llm_config.context_window,
-            usage=usage,
-            provider_id=None,
-            job_id=run_id if run_id else self.current_run_id,
-            step_id=step_id,
-            project_id=agent_state.project_id,
-            stop_reason=stop_reason,
-        )
-
+        # 5. Create messages (step was already created at the beginning)
         tool_call_messages = create_letta_messages_from_llm_response(
             agent_id=agent_state.id,
             model=agent_state.llm_config.model,
@@ -1347,7 +1419,7 @@ class LettaAgent(BaseAgent):
            heartbeat_reason=heartbeat_reason,
            reasoning_content=reasoning_content,
            pre_computed_assistant_message_id=pre_computed_assistant_message_id,
-           step_id=
+           step_id=step_id,
        )
 
        persisted_messages = await self.message_manager.create_many_messages_async(
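Taken together, the `letta_agent.py` hunks invert the step-logging order: instead of `_handle_ai_response` logging the step once at the end (the block deleted in the `@@ -1315,23 +1403,7 @@` hunk), every loop iteration now creates the step row up front with `StepStatus.PENDING`, promotes it to success once the response is handled, and records an error from the `finally` block if the iteration dies early. A condensed sketch of that lifecycle, using the manager method names from this diff but with simplified, purely illustrative helpers (`zero_usage`, `persist_messages`):

```python
# Condensed illustration of the pending-first step lifecycle; not letta's
# actual code. zero_usage() and persist_messages() are hypothetical helpers.
async def run_one_step(step_manager, actor, step_id, llm_call):
    logged_step = await step_manager.log_step_async(
        actor=actor, step_id=step_id, status=StepStatus.PENDING, usage=zero_usage()
    )
    # Messages should only reference a step row that was actually created.
    effective_step_id = step_id if logged_step else None
    try:
        response = await llm_call()
        persist_messages(response, step_id=effective_step_id)
        if logged_step:
            # Promote the pending step once real usage numbers exist.
            await step_manager.update_step_success_async(actor, step_id, response.usage, None)
    except Exception as exc:
        if logged_step:
            # Leave an error record instead of a dangling PENDING row.
            await step_manager.update_step_error_async(
                actor=actor,
                step_id=step_id,
                error_type=type(exc).__name__,
                error_message=str(exc),
            )
        raise
```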
letta/constants.py
CHANGED
@@ -10,6 +10,7 @@ DEFAULT_TIMEZONE = "UTC"
 
 ADMIN_PREFIX = "/v1/admin"
 API_PREFIX = "/v1"
+OLLAMA_API_PREFIX = "/v1"
 OPENAI_API_PREFIX = "/openai"
 
 COMPOSIO_ENTITY_ENV_VAR_KEY = "COMPOSIO_ENTITY"
@@ -50,8 +51,9 @@ TOOL_CALL_ID_MAX_LEN = 29
 # Max steps for agent loop
 DEFAULT_MAX_STEPS = 50
 
-#
+# context window size
 MIN_CONTEXT_WINDOW = 4096
+DEFAULT_CONTEXT_WINDOW = 32000
 
 # number of concurrent embedding requests to sent
 EMBEDDING_BATCH_SIZE = 200
@@ -63,6 +65,7 @@ DEFAULT_MIN_MESSAGE_BUFFER_LENGTH = 15
 # embeddings
 MAX_EMBEDDING_DIM = 4096  # maximum supported embeding size - do NOT change or else DBs will need to be reset
 DEFAULT_EMBEDDING_CHUNK_SIZE = 300
+DEFAULT_EMBEDDING_DIM = 1024
 
 # tokenizers
 EMBEDDING_TO_TOKENIZER_MAP = {
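`DEFAULT_CONTEXT_WINDOW` and `DEFAULT_EMBEDDING_DIM` are new; given the accompanying rewrite of `letta/schemas/providers/ollama.py` (+42/-54 in the file list), a plausible role is as fallbacks when a locally served model does not report these values, though that consumer code is not shown here. A hedged sketch of that kind of use:

```python
# Hypothetical fallback usage; the real consumers of these constants are not
# displayed in this diff.
from letta.constants import DEFAULT_CONTEXT_WINDOW


def resolve_context_window(reported: int | None) -> int:
    # Fall back to the package default when a model reports no usable value.
    return reported if reported and reported > 0 else DEFAULT_CONTEXT_WINDOW
```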
letta/embeddings.py
CHANGED
@@ -139,10 +139,11 @@ class AzureOpenAIEmbedding:
 
 class OllamaEmbeddings:
 
+    # Uses OpenAI API standard
     # Format:
-    # curl http://localhost:11434/
+    # curl http://localhost:11434/v1/embeddings -d '{
     #   "model": "mxbai-embed-large",
-    #   "
+    #   "input": "Llamas are members of the camelid family"
     # }'
 
     def __init__(self, model: str, base_url: str, ollama_additional_kwargs: dict):
@@ -154,18 +155,18 @@ class OllamaEmbeddings:
         import httpx
 
         headers = {"Content-Type": "application/json"}
-        json_data = {"model": self.model, "
+        json_data = {"model": self.model, "input": text}
         json_data.update(self.ollama_additional_kwargs)
 
         with httpx.Client() as client:
             response = client.post(
-                f"{self.base_url}/
+                f"{self.base_url}/embeddings",
                 headers=headers,
                 json=json_data,
            )
 
        response_json = response.json()
-        return response_json["embedding"]
+        return response_json["data"][0]["embedding"]
 
 
 class GoogleEmbeddings:
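The rewritten `OllamaEmbeddings` now talks to Ollama's OpenAI-compatible endpoint: the request body uses the `input` key, the path becomes `/embeddings` under the `/v1` prefix, and the vector moves to the OpenAI-style `data[0].embedding` location in the response. A standalone reproduction of the new request, assuming a local Ollama server on its default port with the `mxbai-embed-large` model pulled:

```python
# Standalone equivalent of the rewritten OllamaEmbeddings request; assumes an
# Ollama server at localhost:11434 with mxbai-embed-large available.
import httpx

base_url = "http://localhost:11434/v1"  # OpenAI-compatible prefix
payload = {"model": "mxbai-embed-large", "input": "Llamas are members of the camelid family"}

with httpx.Client() as client:
    response = client.post(
        f"{base_url}/embeddings",
        headers={"Content-Type": "application/json"},
        json=payload,
    )
embedding = response.json()["data"][0]["embedding"]  # OpenAI-style response shape
print(len(embedding))
```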
letta/functions/function_sets/base.py
CHANGED
@@ -191,14 +191,14 @@ SNIPPET_LINES: int = 4
 
 
 # Based off of: https://github.com/anthropics/anthropic-quickstarts/blob/main/computer-use-demo/computer_use_demo/tools/edit.py?ref=musings.yasyf.com#L154
-def memory_replace(agent_state: "AgentState", label: str, old_str: str, new_str:
+def memory_replace(agent_state: "AgentState", label: str, old_str: str, new_str: str) -> str:  # type: ignore
     """
     The memory_replace command allows you to replace a specific string in a memory block with a new string. This is used for making precise edits.
 
     Args:
         label (str): Section of the memory to be edited, identified by its label.
         old_str (str): The text to replace (must match exactly, including whitespace and indentation).
-        new_str (
+        new_str (str): The new text to insert in place of the old text. Do not include line number prefixes.
 
     Returns:
         str: The success message