letta-nightly 0.8.0.dev20250606104326__py3-none-any.whl → 0.8.2.dev20250606215616__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- letta/__init__.py +1 -1
- letta/agent.py +1 -1
- letta/agents/letta_agent.py +49 -29
- letta/agents/letta_agent_batch.py +1 -2
- letta/agents/voice_agent.py +19 -13
- letta/agents/voice_sleeptime_agent.py +11 -3
- letta/constants.py +18 -0
- letta/data_sources/__init__.py +0 -0
- letta/data_sources/redis_client.py +282 -0
- letta/errors.py +0 -4
- letta/functions/function_sets/files.py +58 -0
- letta/functions/schema_generator.py +18 -1
- letta/groups/sleeptime_multi_agent_v2.py +1 -1
- letta/helpers/datetime_helpers.py +47 -3
- letta/helpers/decorators.py +69 -0
- letta/{services/helpers/noop_helper.py → helpers/singleton.py} +5 -0
- letta/interfaces/anthropic_streaming_interface.py +43 -24
- letta/interfaces/openai_streaming_interface.py +21 -19
- letta/llm_api/anthropic.py +1 -1
- letta/llm_api/anthropic_client.py +22 -14
- letta/llm_api/google_vertex_client.py +1 -1
- letta/llm_api/helpers.py +36 -30
- letta/llm_api/llm_api_tools.py +1 -1
- letta/llm_api/llm_client_base.py +29 -1
- letta/llm_api/openai.py +1 -1
- letta/llm_api/openai_client.py +6 -8
- letta/local_llm/chat_completion_proxy.py +1 -1
- letta/memory.py +1 -1
- letta/orm/enums.py +1 -0
- letta/orm/file.py +80 -3
- letta/orm/files_agents.py +13 -0
- letta/orm/sqlalchemy_base.py +34 -11
- letta/otel/__init__.py +0 -0
- letta/otel/context.py +25 -0
- letta/otel/events.py +0 -0
- letta/otel/metric_registry.py +122 -0
- letta/otel/metrics.py +66 -0
- letta/otel/resource.py +26 -0
- letta/{tracing.py → otel/tracing.py} +55 -78
- letta/plugins/README.md +22 -0
- letta/plugins/__init__.py +0 -0
- letta/plugins/defaults.py +11 -0
- letta/plugins/plugins.py +72 -0
- letta/schemas/enums.py +8 -0
- letta/schemas/file.py +12 -0
- letta/schemas/tool.py +4 -0
- letta/server/db.py +7 -7
- letta/server/rest_api/app.py +8 -6
- letta/server/rest_api/routers/v1/agents.py +37 -36
- letta/server/rest_api/routers/v1/groups.py +3 -3
- letta/server/rest_api/routers/v1/sources.py +26 -3
- letta/server/rest_api/utils.py +9 -6
- letta/server/server.py +18 -12
- letta/services/agent_manager.py +185 -193
- letta/services/block_manager.py +1 -1
- letta/services/context_window_calculator/token_counter.py +3 -2
- letta/services/file_processor/chunker/line_chunker.py +34 -0
- letta/services/file_processor/file_processor.py +40 -11
- letta/services/file_processor/parser/mistral_parser.py +11 -1
- letta/services/files_agents_manager.py +96 -7
- letta/services/group_manager.py +6 -6
- letta/services/helpers/agent_manager_helper.py +373 -3
- letta/services/identity_manager.py +1 -1
- letta/services/job_manager.py +1 -1
- letta/services/llm_batch_manager.py +1 -1
- letta/services/message_manager.py +1 -1
- letta/services/organization_manager.py +1 -1
- letta/services/passage_manager.py +1 -1
- letta/services/per_agent_lock_manager.py +1 -1
- letta/services/provider_manager.py +1 -1
- letta/services/sandbox_config_manager.py +1 -1
- letta/services/source_manager.py +178 -19
- letta/services/step_manager.py +2 -2
- letta/services/summarizer/summarizer.py +1 -1
- letta/services/telemetry_manager.py +1 -1
- letta/services/tool_executor/builtin_tool_executor.py +117 -0
- letta/services/tool_executor/composio_tool_executor.py +53 -0
- letta/services/tool_executor/core_tool_executor.py +474 -0
- letta/services/tool_executor/files_tool_executor.py +131 -0
- letta/services/tool_executor/mcp_tool_executor.py +45 -0
- letta/services/tool_executor/multi_agent_tool_executor.py +123 -0
- letta/services/tool_executor/tool_execution_manager.py +34 -14
- letta/services/tool_executor/tool_execution_sandbox.py +1 -1
- letta/services/tool_executor/tool_executor.py +3 -802
- letta/services/tool_executor/tool_executor_base.py +43 -0
- letta/services/tool_manager.py +55 -59
- letta/services/tool_sandbox/e2b_sandbox.py +1 -1
- letta/services/tool_sandbox/local_sandbox.py +6 -3
- letta/services/user_manager.py +6 -3
- letta/settings.py +21 -1
- letta/utils.py +7 -2
- {letta_nightly-0.8.0.dev20250606104326.dist-info → letta_nightly-0.8.2.dev20250606215616.dist-info}/METADATA +4 -2
- {letta_nightly-0.8.0.dev20250606104326.dist-info → letta_nightly-0.8.2.dev20250606215616.dist-info}/RECORD +96 -74
- {letta_nightly-0.8.0.dev20250606104326.dist-info → letta_nightly-0.8.2.dev20250606215616.dist-info}/LICENSE +0 -0
- {letta_nightly-0.8.0.dev20250606104326.dist-info → letta_nightly-0.8.2.dev20250606215616.dist-info}/WHEEL +0 -0
- {letta_nightly-0.8.0.dev20250606104326.dist-info → letta_nightly-0.8.2.dev20250606215616.dist-info}/entry_points.txt +0 -0
letta/services/agent_manager.py
CHANGED
```diff
@@ -3,9 +3,8 @@ import os
 from datetime import datetime, timezone
 from typing import Dict, List, Optional, Set, Tuple
 
-import numpy as np
 import sqlalchemy as sa
-from sqlalchemy import
+from sqlalchemy import delete, func, insert, literal, or_, select
 from sqlalchemy.dialects.postgresql import insert as pg_insert
 
 from letta.constants import (
@@ -17,10 +16,9 @@ from letta.constants import (
     BASE_VOICE_SLEEPTIME_CHAT_TOOLS,
     BASE_VOICE_SLEEPTIME_TOOLS,
     DATA_SOURCE_ATTACH_ALERT,
-
+    FILES_TOOLS,
     MULTI_AGENT_TOOLS,
 )
-from letta.embeddings import embedding_model
 from letta.helpers.datetime_helpers import get_utc_time
 from letta.llm_api.llm_client import LLMClient
 from letta.log import get_logger
@@ -39,7 +37,7 @@ from letta.orm.errors import NoResultFound
 from letta.orm.sandbox_config import AgentEnvironmentVariable
 from letta.orm.sandbox_config import AgentEnvironmentVariable as AgentEnvironmentVariableModel
 from letta.orm.sqlalchemy_base import AccessType
-from letta.
+from letta.otel.tracing import trace_method
 from letta.schemas.agent import AgentState as PydanticAgentState
 from letta.schemas.agent import AgentType, CreateAgent, UpdateAgent, get_prompt_template_for_agent_type
 from letta.schemas.block import DEFAULT_BLOCKS
@@ -66,6 +64,7 @@ from letta.server.db import db_registry
 from letta.services.block_manager import BlockManager
 from letta.services.context_window_calculator.context_window_calculator import ContextWindowCalculator
 from letta.services.context_window_calculator.token_counter import AnthropicTokenCounter, TiktokenCounter
+from letta.services.files_agents_manager import FileAgentManager
 from letta.services.helpers.agent_manager_helper import (
     _apply_filters,
     _apply_identity_filters,
@@ -74,6 +73,9 @@ from letta.services.helpers.agent_manager_helper import (
     _apply_tag_filter,
     _process_relationship,
     _process_relationship_async,
+    build_agent_passage_query,
+    build_passage_query,
+    build_source_passage_query,
     check_supports_structured_output,
     compile_system_message,
     derive_system_message,
@@ -85,8 +87,6 @@ from letta.services.message_manager import MessageManager
 from letta.services.passage_manager import PassageManager
 from letta.services.source_manager import SourceManager
 from letta.services.tool_manager import ToolManager
-from letta.settings import settings
-from letta.tracing import trace_method
 from letta.utils import enforce_types, united_diff
 
 logger = get_logger(__name__)
@@ -102,6 +102,7 @@ class AgentManager:
         self.message_manager = MessageManager()
         self.passage_manager = PassageManager()
         self.identity_manager = IdentityManager()
+        self.file_agent_manager = FileAgentManager()
 
     @staticmethod
     def _resolve_tools(session, names: Set[str], ids: Set[str], org_id: str) -> Tuple[Dict[str, str], Dict[str, str]]:
@@ -1384,6 +1385,11 @@
         curr_system_message = self.get_system_message(
             agent_id=agent_id, actor=actor
         )  # this is the system + memory bank, not just the system prompt
+
+        if curr_system_message is None:
+            logger.warning(f"No system message found for agent {agent_state.id} and user {actor}")
+            return agent_state
+
         curr_system_message_openai = curr_system_message.to_openai_dict()
 
         # note: we only update the system prompt if the core memory is changed
@@ -1451,6 +1457,11 @@
         curr_system_message = await self.get_system_message_async(
             agent_id=agent_id, actor=actor
         )  # this is the system + memory bank, not just the system prompt
+
+        if curr_system_message is None:
+            logger.warning(f"No system message found for agent {agent_state.id} and user {actor}")
+            return agent_state
+
         curr_system_message_openai = curr_system_message.to_openai_dict()
 
         # note: we only update the system prompt if the core memory is changed
@@ -1650,12 +1661,18 @@
     @trace_method
     @enforce_types
     async def refresh_memory_async(self, agent_state: PydanticAgentState, actor: PydanticUser) -> PydanticAgentState:
+        # TODO: This will NOT work for new blocks/file blocks added intra-step
         block_ids = [b.id for b in agent_state.memory.blocks]
-
-
+        file_block_names = [b.label for b in agent_state.memory.file_blocks]
+
+        if block_ids:
+            blocks = await self.block_manager.get_all_blocks_by_ids_async(block_ids=[b.id for b in agent_state.memory.blocks], actor=actor)
+            agent_state.memory.blocks = [b for b in blocks if b is not None]
+
+        if file_block_names:
+            file_blocks = await self.file_agent_manager.get_all_file_blocks_by_name(file_names=file_block_names, actor=actor)
+            agent_state.memory.file_blocks = [b for b in file_blocks if b is not None]
 
-        blocks = await self.block_manager.get_all_blocks_by_ids_async(block_ids=[b.id for b in agent_state.memory.blocks], actor=actor)
-        agent_state.memory.blocks = [b for b in blocks if b is not None]
         return agent_state
 
     # ======================================================================================================================
```
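Worth noting for readers of `refresh_memory_async`: the rewrite refreshes file blocks alongside core memory blocks and skips the database round trip when either list is empty. A minimal usage sketch, not part of the diff; the `agent_state` and `actor` objects are assumed to come from a live Letta server context:

```python
# Sketch only: exercising the rewritten refresh_memory_async.
from letta.services.agent_manager import AgentManager


async def refresh(agent_state, actor):
    manager = AgentManager()
    # Per the hunk above, empty block / file-block lists now
    # short-circuit their respective DB fetches.
    return await manager.refresh_memory_async(agent_state=agent_state, actor=actor)
```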
```diff
@@ -2006,184 +2023,6 @@ class AgentManager:
     # ======================================================================================================================
     # Passage Management
     # ======================================================================================================================
-    def _build_passage_query(
-        self,
-        actor: PydanticUser,
-        agent_id: Optional[str] = None,
-        file_id: Optional[str] = None,
-        query_text: Optional[str] = None,
-        start_date: Optional[datetime] = None,
-        end_date: Optional[datetime] = None,
-        before: Optional[str] = None,
-        after: Optional[str] = None,
-        source_id: Optional[str] = None,
-        embed_query: bool = False,
-        ascending: bool = True,
-        embedding_config: Optional[EmbeddingConfig] = None,
-        agent_only: bool = False,
-    ) -> Select:
-        """Helper function to build the base passage query with all filters applied.
-        Supports both before and after pagination across merged source and agent passages.
-
-        Returns the query before any limit or count operations are applied.
-        """
-        embedded_text = None
-        if embed_query:
-            assert embedding_config is not None, "embedding_config must be specified for vector search"
-            assert query_text is not None, "query_text must be specified for vector search"
-            embedded_text = embedding_model(embedding_config).get_text_embedding(query_text)
-            embedded_text = np.array(embedded_text)
-            embedded_text = np.pad(embedded_text, (0, MAX_EMBEDDING_DIM - embedded_text.shape[0]), mode="constant").tolist()
-
-        # Start with base query for source passages
-        source_passages = None
-        if not agent_only:  # Include source passages
-            if agent_id is not None:
-                source_passages = (
-                    select(SourcePassage, literal(None).label("agent_id"))
-                    .join(SourcesAgents, SourcesAgents.source_id == SourcePassage.source_id)
-                    .where(SourcesAgents.agent_id == agent_id)
-                    .where(SourcePassage.organization_id == actor.organization_id)
-                )
-            else:
-                source_passages = select(SourcePassage, literal(None).label("agent_id")).where(
-                    SourcePassage.organization_id == actor.organization_id
-                )
-
-            if source_id:
-                source_passages = source_passages.where(SourcePassage.source_id == source_id)
-            if file_id:
-                source_passages = source_passages.where(SourcePassage.file_id == file_id)
-
-        # Add agent passages query
-        agent_passages = None
-        if agent_id is not None:
-            agent_passages = (
-                select(
-                    AgentPassage.id,
-                    AgentPassage.text,
-                    AgentPassage.embedding_config,
-                    AgentPassage.metadata_,
-                    AgentPassage.embedding,
-                    AgentPassage.created_at,
-                    AgentPassage.updated_at,
-                    AgentPassage.is_deleted,
-                    AgentPassage._created_by_id,
-                    AgentPassage._last_updated_by_id,
-                    AgentPassage.organization_id,
-                    literal(None).label("file_id"),
-                    literal(None).label("source_id"),
-                    AgentPassage.agent_id,
-                )
-                .where(AgentPassage.agent_id == agent_id)
-                .where(AgentPassage.organization_id == actor.organization_id)
-            )
-
-        # Combine queries
-        if source_passages is not None and agent_passages is not None:
-            combined_query = union_all(source_passages, agent_passages).cte("combined_passages")
-        elif agent_passages is not None:
-            combined_query = agent_passages.cte("combined_passages")
-        elif source_passages is not None:
-            combined_query = source_passages.cte("combined_passages")
-        else:
-            raise ValueError("No passages found")
-
-        # Build main query from combined CTE
-        main_query = select(combined_query)
-
-        # Apply filters
-        if start_date:
-            main_query = main_query.where(combined_query.c.created_at >= start_date)
-        if end_date:
-            main_query = main_query.where(combined_query.c.created_at <= end_date)
-        if source_id:
-            main_query = main_query.where(combined_query.c.source_id == source_id)
-        if file_id:
-            main_query = main_query.where(combined_query.c.file_id == file_id)
-
-        # Vector search
-        if embedded_text:
-            if settings.letta_pg_uri_no_default:
-                # PostgreSQL with pgvector
-                main_query = main_query.order_by(combined_query.c.embedding.cosine_distance(embedded_text).asc())
-            else:
-                # SQLite with custom vector type
-                query_embedding_binary = adapt_array(embedded_text)
-                main_query = main_query.order_by(
-                    func.cosine_distance(combined_query.c.embedding, query_embedding_binary).asc(),
-                    combined_query.c.created_at.asc() if ascending else combined_query.c.created_at.desc(),
-                    combined_query.c.id.asc(),
-                )
-        else:
-            if query_text:
-                main_query = main_query.where(func.lower(combined_query.c.text).contains(func.lower(query_text)))
-
-        # Handle pagination
-        if before or after:
-            # Create reference CTEs
-            if before:
-                before_ref = select(combined_query.c.created_at, combined_query.c.id).where(combined_query.c.id == before).cte("before_ref")
-            if after:
-                after_ref = select(combined_query.c.created_at, combined_query.c.id).where(combined_query.c.id == after).cte("after_ref")
-
-            if before and after:
-                # Window-based query (get records between before and after)
-                main_query = main_query.where(
-                    or_(
-                        combined_query.c.created_at < select(before_ref.c.created_at).scalar_subquery(),
-                        and_(
-                            combined_query.c.created_at == select(before_ref.c.created_at).scalar_subquery(),
-                            combined_query.c.id < select(before_ref.c.id).scalar_subquery(),
-                        ),
-                    )
-                )
-                main_query = main_query.where(
-                    or_(
-                        combined_query.c.created_at > select(after_ref.c.created_at).scalar_subquery(),
-                        and_(
-                            combined_query.c.created_at == select(after_ref.c.created_at).scalar_subquery(),
-                            combined_query.c.id > select(after_ref.c.id).scalar_subquery(),
-                        ),
-                    )
-                )
-            else:
-                # Pure pagination (only before or only after)
-                if before:
-                    main_query = main_query.where(
-                        or_(
-                            combined_query.c.created_at < select(before_ref.c.created_at).scalar_subquery(),
-                            and_(
-                                combined_query.c.created_at == select(before_ref.c.created_at).scalar_subquery(),
-                                combined_query.c.id < select(before_ref.c.id).scalar_subquery(),
-                            ),
-                        )
-                    )
-                if after:
-                    main_query = main_query.where(
-                        or_(
-                            combined_query.c.created_at > select(after_ref.c.created_at).scalar_subquery(),
-                            and_(
-                                combined_query.c.created_at == select(after_ref.c.created_at).scalar_subquery(),
-                                combined_query.c.id > select(after_ref.c.id).scalar_subquery(),
-                            ),
-                        )
-                    )
-
-        # Add ordering if not already ordered by similarity
-        if not embed_query:
-            if ascending:
-                main_query = main_query.order_by(
-                    combined_query.c.created_at.asc(),
-                    combined_query.c.id.asc(),
-                )
-            else:
-                main_query = main_query.order_by(
-                    combined_query.c.created_at.desc(),
-                    combined_query.c.id.asc(),
-                )
-
-        return main_query
 
     @trace_method
     @enforce_types
```
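The removed `_build_passage_query` does not simply disappear: the imports earlier in this diff and the +373-line growth of `letta/services/helpers/agent_manager_helper.py` indicate it moves there as the module-level `build_passage_query`, joined by the new `build_agent_passage_query` and `build_source_passage_query` variants. A hedged sketch of the new call shape; the argument values are illustrative:

```python
# Sketch of the refactored call shape; query execution stays with the caller.
from letta.services.helpers.agent_manager_helper import build_passage_query


def make_query(actor):  # actor: a letta PydanticUser (assumed to exist)
    return build_passage_query(
        actor=actor,
        agent_id="agent-123",  # illustrative ID
        query_text="vacation plans",
        ascending=False,
    )
    # Callers then apply .limit(...) and execute inside a session,
    # as the list-passages hunks below do.
```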
```diff
@@ -2206,7 +2045,7 @@ class AgentManager:
     ) -> List[PydanticPassage]:
         """Lists all passages attached to an agent."""
         with db_registry.session() as session:
-            main_query =
+            main_query = build_passage_query(
                 actor=actor,
                 agent_id=agent_id,
                 file_id=file_id,
@@ -2266,7 +2105,7 @@ class AgentManager:
     ) -> List[PydanticPassage]:
         """Lists all passages attached to an agent."""
         async with db_registry.async_session() as session:
-            main_query =
+            main_query = build_passage_query(
                 actor=actor,
                 agent_id=agent_id,
                 file_id=file_id,
@@ -2305,6 +2144,100 @@ class AgentManager:
 
         return [p.to_pydantic() for p in passages]
 
+    @trace_method
+    @enforce_types
+    async def list_source_passages_async(
+        self,
+        actor: PydanticUser,
+        agent_id: Optional[str] = None,
+        file_id: Optional[str] = None,
+        limit: Optional[int] = 50,
+        query_text: Optional[str] = None,
+        start_date: Optional[datetime] = None,
+        end_date: Optional[datetime] = None,
+        before: Optional[str] = None,
+        after: Optional[str] = None,
+        source_id: Optional[str] = None,
+        embed_query: bool = False,
+        ascending: bool = True,
+        embedding_config: Optional[EmbeddingConfig] = None,
+    ) -> List[PydanticPassage]:
+        """Lists all passages attached to an agent."""
+        async with db_registry.async_session() as session:
+            main_query = build_source_passage_query(
+                actor=actor,
+                agent_id=agent_id,
+                file_id=file_id,
+                query_text=query_text,
+                start_date=start_date,
+                end_date=end_date,
+                before=before,
+                after=after,
+                source_id=source_id,
+                embed_query=embed_query,
+                ascending=ascending,
+                embedding_config=embedding_config,
+            )
+
+            # Add limit
+            if limit:
+                main_query = main_query.limit(limit)
+
+            # Execute query
+            result = await session.execute(main_query)
+
+            # Get ORM objects directly using scalars()
+            passages = result.scalars().all()
+
+            # Convert to Pydantic models
+            return [p.to_pydantic() for p in passages]
+
+    @trace_method
+    @enforce_types
+    async def list_agent_passages_async(
+        self,
+        actor: PydanticUser,
+        agent_id: Optional[str] = None,
+        file_id: Optional[str] = None,
+        limit: Optional[int] = 50,
+        query_text: Optional[str] = None,
+        start_date: Optional[datetime] = None,
+        end_date: Optional[datetime] = None,
+        before: Optional[str] = None,
+        after: Optional[str] = None,
+        source_id: Optional[str] = None,
+        embed_query: bool = False,
+        ascending: bool = True,
+        embedding_config: Optional[EmbeddingConfig] = None,
+    ) -> List[PydanticPassage]:
+        """Lists all passages attached to an agent."""
+        async with db_registry.async_session() as session:
+            main_query = build_agent_passage_query(
+                actor=actor,
+                agent_id=agent_id,
+                query_text=query_text,
+                start_date=start_date,
+                end_date=end_date,
+                before=before,
+                after=after,
+                embed_query=embed_query,
+                ascending=ascending,
+                embedding_config=embedding_config,
+            )
+
+            # Add limit
+            if limit:
+                main_query = main_query.limit(limit)
+
+            # Execute query
+            result = await session.execute(main_query)
+
+            # Get ORM objects directly using scalars()
+            passages = result.scalars().all()
+
+            # Convert to Pydantic models
+            return [p.to_pydantic() for p in passages]
+
     @trace_method
     @enforce_types
     def passage_size(
```
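The two new listers split the previously merged passage view into source-only and agent-only queries. A hypothetical caller, using only arguments that appear in the signatures above:

```python
# Sketch: fetching both passage kinds for one agent via the new methods.
from letta.services.agent_manager import AgentManager


async def show_passages(actor, agent_id: str):
    manager = AgentManager()
    source = await manager.list_source_passages_async(actor=actor, agent_id=agent_id, limit=10)
    agent = await manager.list_agent_passages_async(actor=actor, agent_id=agent_id, limit=10)
    return source, agent
```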
```diff
@@ -2325,7 +2258,7 @@ class AgentManager:
     ) -> int:
         """Returns the count of passages matching the given criteria."""
         with db_registry.session() as session:
-            main_query =
+            main_query = build_passage_query(
                 actor=actor,
                 agent_id=agent_id,
                 file_id=file_id,
@@ -2363,7 +2296,7 @@ class AgentManager:
         agent_only: bool = False,
     ) -> int:
         async with db_registry.async_session() as session:
-            main_query =
+            main_query = build_passage_query(
                 actor=actor,
                 agent_id=agent_id,
                 file_id=file_id,
@@ -2458,6 +2391,65 @@ class AgentManager:
         await agent.update_async(session, actor=actor)
         return await agent.to_pydantic_async()
 
+    @trace_method
+    @enforce_types
+    async def attach_missing_files_tools_async(self, agent_state: PydanticAgentState, actor: PydanticUser) -> PydanticAgentState:
+        """
+        Attaches missing core file tools to an agent.
+
+        Args:
+            agent_id: ID of the agent to attach the tools to.
+            actor: User performing the action.
+
+        Raises:
+            NoResultFound: If the agent or tool is not found.
+
+        Returns:
+            PydanticAgentState: The updated agent state.
+        """
+        # Check if the agent is missing any files tools
+        core_tool_names = {tool.name for tool in agent_state.tools if tool.tool_type == ToolType.LETTA_FILES_CORE}
+        missing_tool_names = set(FILES_TOOLS).difference(core_tool_names)
+
+        for tool_name in missing_tool_names:
+            tool_id = await self.tool_manager.get_tool_id_by_name_async(tool_name=tool_name, actor=actor)
+
+            # TODO: This is hacky and deserves a rethink - how do we keep all the base tools available in every org always?
+            if not tool_id:
+                await self.tool_manager.upsert_base_tools_async(actor=actor, allowed_types={ToolType.LETTA_FILES_CORE})
+
+            # TODO: Inefficient - I think this re-retrieves the agent_state?
+            agent_state = await self.attach_tool_async(agent_id=agent_state.id, tool_id=tool_id, actor=actor)
+
+        return agent_state
+
+    @trace_method
+    @enforce_types
+    async def detach_all_files_tools_async(self, agent_state: PydanticAgentState, actor: PydanticUser) -> PydanticAgentState:
+        """
+        Detach all core file tools from an agent.
+
+        Args:
+            agent_id: ID of the agent to detach the tools from.
+            actor: User performing the action.
+
+        Raises:
+            NoResultFound: If the agent or tool is not found.
+
+        Returns:
+            PydanticAgentState: The updated agent state.
+        """
+        # Check if the agent is missing any files tools
+        core_tool_names = {tool.name for tool in agent_state.tools if tool.tool_type == ToolType.LETTA_FILES_CORE}
+
+        for tool_name in core_tool_names:
+            tool_id = await self.tool_manager.get_tool_id_by_name_async(tool_name=tool_name, actor=actor)
+
+            # TODO: Inefficient - I think this re-retrieves the agent_state?
+            agent_state = await self.detach_tool_async(agent_id=agent_state.id, tool_id=tool_id, actor=actor)
+
+        return agent_state
+
     @trace_method
     @enforce_types
     def detach_tool(self, agent_id: str, tool_id: str, actor: PydanticUser) -> PydanticAgentState:
```
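`attach_missing_files_tools_async` reduces to a set difference between the `FILES_TOOLS` constant (added to `letta/constants.py` in this release) and the file tools already attached to the agent. A standalone restatement of that logic; the tool names here are invented, since the diff does not show the constant's contents:

```python
# Standalone illustration of the set logic; FILES_TOOLS contents are
# hypothetical -- the real values live in letta/constants.py.
FILES_TOOLS = ["open_file", "close_file", "grep_file"]

attached = {"open_file"}  # names of ToolType.LETTA_FILES_CORE tools already on the agent
missing = set(FILES_TOOLS).difference(attached)
print(sorted(missing))  # ['close_file', 'grep_file']
```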
letta/services/block_manager.py
CHANGED
```diff
@@ -9,12 +9,12 @@ from letta.orm.block import Block as BlockModel
 from letta.orm.block_history import BlockHistory
 from letta.orm.enums import ActorType
 from letta.orm.errors import NoResultFound
+from letta.otel.tracing import trace_method
 from letta.schemas.agent import AgentState as PydanticAgentState
 from letta.schemas.block import Block as PydanticBlock
 from letta.schemas.block import BlockUpdate
 from letta.schemas.user import User as PydanticUser
 from letta.server.db import db_registry
-from letta.tracing import trace_method
 from letta.utils import enforce_types
 
 logger = get_logger(__name__)
```
letta/services/context_window_calculator/token_counter.py
CHANGED
```diff
@@ -2,6 +2,7 @@ from abc import ABC, abstractmethod
 from typing import Any, Dict, List
 
 from letta.llm_api.anthropic_client import AnthropicClient
+from letta.schemas.openai.chat_completion_request import Tool as OpenAITool
 from letta.utils import count_tokens
 
 
@@ -42,7 +43,7 @@ class AnthropicTokenCounter(TokenCounter):
             return 0
         return await self.client.count_tokens(model=self.model, messages=messages)
 
-    async def count_tool_tokens(self, tools: List[
+    async def count_tool_tokens(self, tools: List[OpenAITool]) -> int:
         if not tools:
             return 0
         return await self.client.count_tokens(model=self.model, tools=tools)
@@ -69,7 +70,7 @@ class TiktokenCounter(TokenCounter):
 
         return num_tokens_from_messages(messages=messages, model=self.model)
 
-    async def count_tool_tokens(self, tools: List[
+    async def count_tool_tokens(self, tools: List[OpenAITool]) -> int:
         if not tools:
             return 0
         from letta.local_llm.utils import num_tokens_from_functions
```
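The signature fix pins `tools` to the OpenAI chat-completion `Tool` schema rather than the previously untyped form. A hedged sketch of constructing one such tool; the exact Pydantic field layout of letta's `Tool` model is an assumption based on the standard OpenAI schema:

```python
# Sketch: building the OpenAITool the counters now expect.
# Field layout assumed from the OpenAI chat-completion tool schema.
from letta.schemas.openai.chat_completion_request import Tool as OpenAITool

tool = OpenAITool(
    type="function",
    function={
        "name": "get_weather",  # hypothetical tool
        "description": "Look up current weather for a city",
        "parameters": {"type": "object", "properties": {"city": {"type": "string"}}},
    },
)
# tokens = await counter.count_tool_tokens([tool])  # counter per this diff
```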
letta/services/file_processor/chunker/line_chunker.py
ADDED
```diff
@@ -0,0 +1,34 @@
+from typing import List, Optional
+
+from letta.log import get_logger
+
+logger = get_logger(__name__)
+
+
+class LineChunker:
+    """Newline chunker"""
+
+    def __init__(self):
+        pass
+
+    # TODO: Make this more general beyond Mistral
+    def chunk_text(self, text: str, start: Optional[int] = None, end: Optional[int] = None) -> List[str]:
+        """Split lines"""
+        content_lines = [line.strip() for line in text.split("\n") if line.strip()]
+        total_lines = len(content_lines)
+
+        if start and end:
+            content_lines = content_lines[start:end]
+            line_offset = start
+        else:
+            line_offset = 0
+
+        content_lines = [f"Line {i + line_offset}: {line}" for i, line in enumerate(content_lines)]
+
+        # Add metadata about total lines
+        if start and end:
+            content_lines.insert(0, f"[Viewing lines {start} to {end} (out of {total_lines} lines)]")
+        else:
+            content_lines.insert(0, f"[Viewing file start (out of {total_lines} lines)]")
+
+        return content_lines
```
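Since `LineChunker` is new, a quick usage sketch derived directly from the code above, with its expected output. Note that a `start` of 0 falls into the unsliced branch because of the `if start and end` truthiness test:

```python
from letta.services.file_processor.chunker.line_chunker import LineChunker

chunker = LineChunker()
text = "alpha\n\nbeta\ngamma"  # blank lines are dropped before numbering
print("\n".join(chunker.chunk_text(text)))
# [Viewing file start (out of 3 lines)]
# Line 0: alpha
# Line 1: beta
# Line 2: gamma
```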
letta/services/file_processor/file_processor.py
CHANGED
```diff
@@ -5,12 +5,13 @@ from fastapi import UploadFile
 
 from letta.log import get_logger
 from letta.schemas.agent import AgentState
-from letta.schemas.enums import JobStatus
+from letta.schemas.enums import FileProcessingStatus, JobStatus
 from letta.schemas.file import FileMetadata
 from letta.schemas.job import Job, JobUpdate
 from letta.schemas.passage import Passage
 from letta.schemas.user import User
 from letta.server.server import SyncServer
+from letta.services.file_processor.chunker.line_chunker import LineChunker
 from letta.services.file_processor.chunker.llama_index_chunker import LlamaIndexChunker
 from letta.services.file_processor.embedder.openai_embedder import OpenAIEmbedder
 from letta.services.file_processor.parser.mistral_parser import MistralFileParser
@@ -34,6 +35,7 @@ class FileProcessor:
     ):
         self.file_parser = file_parser
         self.text_chunker = text_chunker
+        self.line_chunker = LineChunker()
         self.embedder = embedder
         self.max_file_size = max_file_size
         self.source_manager = SourceManager()
@@ -52,9 +54,12 @@ class FileProcessor:
         job: Optional[Job] = None,
     ) -> List[Passage]:
         file_metadata = self._extract_upload_file_metadata(file, source_id=source_id)
-        file_metadata = await self.source_manager.create_file(file_metadata, self.actor)
         filename = file_metadata.file_name
 
+        # Create file as early as possible with no content
+        file_metadata.processing_status = FileProcessingStatus.PARSING  # Parsing now
+        file_metadata = await self.source_manager.create_file(file_metadata, self.actor)
+
         try:
             # Ensure we're working with bytes
             if isinstance(content, str):
@@ -66,11 +71,35 @@ class FileProcessor:
             logger.info(f"Starting OCR extraction for {filename}")
             ocr_response = await self.file_parser.extract_text(content, mime_type=file_metadata.file_type)
 
+            # update file with raw text
+            raw_markdown_text = "".join([page.markdown for page in ocr_response.pages])
+            file_metadata = await self.source_manager.upsert_file_content(
+                file_id=file_metadata.id, text=raw_markdown_text, actor=self.actor
+            )
+            file_metadata = await self.source_manager.update_file_status(
+                file_id=file_metadata.id, actor=self.actor, processing_status=FileProcessingStatus.EMBEDDING
+            )
+
+            # Insert to agent context window
+            # TODO: Rethink this line chunking mechanism
+            content_lines = self.line_chunker.chunk_text(text=raw_markdown_text)
+            visible_content = "\n".join(content_lines)
+
+            await server.insert_file_into_context_windows(
+                source_id=source_id,
+                text=visible_content,
+                file_id=file_metadata.id,
+                file_name=file_metadata.file_name,
+                actor=self.actor,
+                agent_states=agent_states,
+            )
+
             if not ocr_response or len(ocr_response.pages) == 0:
                 raise ValueError("No text extracted from PDF")
 
             logger.info("Chunking extracted text")
             all_passages = []
+
             for page in ocr_response.pages:
                 chunks = self.text_chunker.chunk_text(page)
 
@@ -86,24 +115,20 @@ class FileProcessor:
 
             logger.info(f"Successfully processed {filename}: {len(all_passages)} passages")
 
-            await server.insert_file_into_context_windows(
-                source_id=source_id,
-                text="".join([ocr_response.pages[i].markdown for i in range(min(3, len(ocr_response.pages)))]),
-                file_id=file_metadata.id,
-                actor=self.actor,
-                agent_states=agent_states,
-            )
-
             # update job status
             if job:
                 job.status = JobStatus.completed
                 job.metadata["num_passages"] = len(all_passages)
                 await self.job_manager.update_job_by_id_async(job_id=job.id, job_update=JobUpdate(**job.model_dump()), actor=self.actor)
 
+            await self.source_manager.update_file_status(
+                file_id=file_metadata.id, actor=self.actor, processing_status=FileProcessingStatus.COMPLETED
+            )
+
             return all_passages
 
         except Exception as e:
-            logger.error(f"
+            logger.error(f"File processing failed for {filename}: {str(e)}")
 
             # update job status
             if job:
@@ -111,6 +136,10 @@ class FileProcessor:
                 job.metadata["error"] = str(e)
                 await self.job_manager.update_job_by_id_async(job_id=job.id, job_update=JobUpdate(**job.model_dump()), actor=self.actor)
 
+            await self.source_manager.update_file_status(
+                file_id=file_metadata.id, actor=self.actor, processing_status=FileProcessingStatus.ERROR, error_message=str(e)
+            )
+
             return []
 
     def _extract_upload_file_metadata(self, file: UploadFile, source_id: str) -> FileMetadata:
```
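Taken together, the `file_processor.py` hunks thread a `FileProcessingStatus` through the pipeline: the file row is created in `PARSING` before OCR, moves to `EMBEDDING` once the raw markdown is stored, and ends in `COMPLETED`, or on any exception in `ERROR` with an `error_message`. A compact restatement of that lifecycle; only the four enum members visible in the hunks are assumed to exist:

```python
# Lifecycle implied by the hunks above; enum members taken from the diff.
from letta.schemas.enums import FileProcessingStatus

LIFECYCLE = [
    FileProcessingStatus.PARSING,    # set before source_manager.create_file
    FileProcessingStatus.EMBEDDING,  # after raw OCR markdown is upserted
    FileProcessingStatus.COMPLETED,  # after passages are embedded and the job closes
]
FAILURE = FileProcessingStatus.ERROR  # any exception, with error_message=str(e)

print(" -> ".join(s.name for s in LIFECYCLE), "| failure:", FAILURE.name)
```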
|