letta-nightly 0.1.7.dev20240924104148__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of letta-nightly might be problematic; see the registry's advisory page for more details.
- letta/__init__.py +24 -0
- letta/__main__.py +3 -0
- letta/agent.py +1427 -0
- letta/agent_store/chroma.py +295 -0
- letta/agent_store/db.py +546 -0
- letta/agent_store/lancedb.py +177 -0
- letta/agent_store/milvus.py +198 -0
- letta/agent_store/qdrant.py +201 -0
- letta/agent_store/storage.py +188 -0
- letta/benchmark/benchmark.py +96 -0
- letta/benchmark/constants.py +14 -0
- letta/cli/cli.py +689 -0
- letta/cli/cli_config.py +1282 -0
- letta/cli/cli_load.py +166 -0
- letta/client/__init__.py +0 -0
- letta/client/admin.py +171 -0
- letta/client/client.py +2360 -0
- letta/client/streaming.py +90 -0
- letta/client/utils.py +61 -0
- letta/config.py +484 -0
- letta/configs/anthropic.json +13 -0
- letta/configs/letta_hosted.json +11 -0
- letta/configs/openai.json +12 -0
- letta/constants.py +134 -0
- letta/credentials.py +140 -0
- letta/data_sources/connectors.py +247 -0
- letta/embeddings.py +218 -0
- letta/errors.py +26 -0
- letta/functions/__init__.py +0 -0
- letta/functions/function_sets/base.py +174 -0
- letta/functions/function_sets/extras.py +132 -0
- letta/functions/functions.py +105 -0
- letta/functions/schema_generator.py +205 -0
- letta/humans/__init__.py +0 -0
- letta/humans/examples/basic.txt +1 -0
- letta/humans/examples/cs_phd.txt +9 -0
- letta/interface.py +314 -0
- letta/llm_api/__init__.py +0 -0
- letta/llm_api/anthropic.py +383 -0
- letta/llm_api/azure_openai.py +155 -0
- letta/llm_api/cohere.py +396 -0
- letta/llm_api/google_ai.py +468 -0
- letta/llm_api/llm_api_tools.py +485 -0
- letta/llm_api/openai.py +470 -0
- letta/local_llm/README.md +3 -0
- letta/local_llm/__init__.py +0 -0
- letta/local_llm/chat_completion_proxy.py +279 -0
- letta/local_llm/constants.py +31 -0
- letta/local_llm/function_parser.py +68 -0
- letta/local_llm/grammars/__init__.py +0 -0
- letta/local_llm/grammars/gbnf_grammar_generator.py +1324 -0
- letta/local_llm/grammars/json.gbnf +26 -0
- letta/local_llm/grammars/json_func_calls_with_inner_thoughts.gbnf +32 -0
- letta/local_llm/groq/api.py +97 -0
- letta/local_llm/json_parser.py +202 -0
- letta/local_llm/koboldcpp/api.py +62 -0
- letta/local_llm/koboldcpp/settings.py +23 -0
- letta/local_llm/llamacpp/api.py +58 -0
- letta/local_llm/llamacpp/settings.py +22 -0
- letta/local_llm/llm_chat_completion_wrappers/__init__.py +0 -0
- letta/local_llm/llm_chat_completion_wrappers/airoboros.py +452 -0
- letta/local_llm/llm_chat_completion_wrappers/chatml.py +470 -0
- letta/local_llm/llm_chat_completion_wrappers/configurable_wrapper.py +387 -0
- letta/local_llm/llm_chat_completion_wrappers/dolphin.py +246 -0
- letta/local_llm/llm_chat_completion_wrappers/llama3.py +345 -0
- letta/local_llm/llm_chat_completion_wrappers/simple_summary_wrapper.py +156 -0
- letta/local_llm/llm_chat_completion_wrappers/wrapper_base.py +11 -0
- letta/local_llm/llm_chat_completion_wrappers/zephyr.py +345 -0
- letta/local_llm/lmstudio/api.py +100 -0
- letta/local_llm/lmstudio/settings.py +29 -0
- letta/local_llm/ollama/api.py +88 -0
- letta/local_llm/ollama/settings.py +32 -0
- letta/local_llm/settings/__init__.py +0 -0
- letta/local_llm/settings/deterministic_mirostat.py +45 -0
- letta/local_llm/settings/settings.py +72 -0
- letta/local_llm/settings/simple.py +28 -0
- letta/local_llm/utils.py +265 -0
- letta/local_llm/vllm/api.py +63 -0
- letta/local_llm/webui/api.py +60 -0
- letta/local_llm/webui/legacy_api.py +58 -0
- letta/local_llm/webui/legacy_settings.py +23 -0
- letta/local_llm/webui/settings.py +24 -0
- letta/log.py +76 -0
- letta/main.py +437 -0
- letta/memory.py +440 -0
- letta/metadata.py +884 -0
- letta/openai_backcompat/__init__.py +0 -0
- letta/openai_backcompat/openai_object.py +437 -0
- letta/persistence_manager.py +148 -0
- letta/personas/__init__.py +0 -0
- letta/personas/examples/anna_pa.txt +13 -0
- letta/personas/examples/google_search_persona.txt +15 -0
- letta/personas/examples/memgpt_doc.txt +6 -0
- letta/personas/examples/memgpt_starter.txt +4 -0
- letta/personas/examples/sam.txt +14 -0
- letta/personas/examples/sam_pov.txt +14 -0
- letta/personas/examples/sam_simple_pov_gpt35.txt +13 -0
- letta/personas/examples/sqldb/test.db +0 -0
- letta/prompts/__init__.py +0 -0
- letta/prompts/gpt_summarize.py +14 -0
- letta/prompts/gpt_system.py +26 -0
- letta/prompts/system/memgpt_base.txt +49 -0
- letta/prompts/system/memgpt_chat.txt +58 -0
- letta/prompts/system/memgpt_chat_compressed.txt +13 -0
- letta/prompts/system/memgpt_chat_fstring.txt +51 -0
- letta/prompts/system/memgpt_doc.txt +50 -0
- letta/prompts/system/memgpt_gpt35_extralong.txt +53 -0
- letta/prompts/system/memgpt_intuitive_knowledge.txt +31 -0
- letta/prompts/system/memgpt_modified_chat.txt +23 -0
- letta/pytest.ini +0 -0
- letta/schemas/agent.py +117 -0
- letta/schemas/api_key.py +21 -0
- letta/schemas/block.py +135 -0
- letta/schemas/document.py +21 -0
- letta/schemas/embedding_config.py +54 -0
- letta/schemas/enums.py +35 -0
- letta/schemas/job.py +38 -0
- letta/schemas/letta_base.py +80 -0
- letta/schemas/letta_message.py +175 -0
- letta/schemas/letta_request.py +23 -0
- letta/schemas/letta_response.py +28 -0
- letta/schemas/llm_config.py +54 -0
- letta/schemas/memory.py +224 -0
- letta/schemas/message.py +727 -0
- letta/schemas/openai/chat_completion_request.py +123 -0
- letta/schemas/openai/chat_completion_response.py +136 -0
- letta/schemas/openai/chat_completions.py +123 -0
- letta/schemas/openai/embedding_response.py +11 -0
- letta/schemas/openai/openai.py +157 -0
- letta/schemas/organization.py +20 -0
- letta/schemas/passage.py +80 -0
- letta/schemas/source.py +62 -0
- letta/schemas/tool.py +143 -0
- letta/schemas/usage.py +18 -0
- letta/schemas/user.py +33 -0
- letta/server/__init__.py +0 -0
- letta/server/constants.py +6 -0
- letta/server/rest_api/__init__.py +0 -0
- letta/server/rest_api/admin/__init__.py +0 -0
- letta/server/rest_api/admin/agents.py +21 -0
- letta/server/rest_api/admin/tools.py +83 -0
- letta/server/rest_api/admin/users.py +98 -0
- letta/server/rest_api/app.py +193 -0
- letta/server/rest_api/auth/__init__.py +0 -0
- letta/server/rest_api/auth/index.py +43 -0
- letta/server/rest_api/auth_token.py +22 -0
- letta/server/rest_api/interface.py +726 -0
- letta/server/rest_api/routers/__init__.py +0 -0
- letta/server/rest_api/routers/openai/__init__.py +0 -0
- letta/server/rest_api/routers/openai/assistants/__init__.py +0 -0
- letta/server/rest_api/routers/openai/assistants/assistants.py +115 -0
- letta/server/rest_api/routers/openai/assistants/schemas.py +121 -0
- letta/server/rest_api/routers/openai/assistants/threads.py +336 -0
- letta/server/rest_api/routers/openai/chat_completions/__init__.py +0 -0
- letta/server/rest_api/routers/openai/chat_completions/chat_completions.py +131 -0
- letta/server/rest_api/routers/v1/__init__.py +15 -0
- letta/server/rest_api/routers/v1/agents.py +543 -0
- letta/server/rest_api/routers/v1/blocks.py +73 -0
- letta/server/rest_api/routers/v1/jobs.py +46 -0
- letta/server/rest_api/routers/v1/llms.py +28 -0
- letta/server/rest_api/routers/v1/organizations.py +61 -0
- letta/server/rest_api/routers/v1/sources.py +199 -0
- letta/server/rest_api/routers/v1/tools.py +103 -0
- letta/server/rest_api/routers/v1/users.py +109 -0
- letta/server/rest_api/static_files.py +74 -0
- letta/server/rest_api/utils.py +69 -0
- letta/server/server.py +1995 -0
- letta/server/startup.sh +8 -0
- letta/server/static_files/assets/index-0cbf7ad5.js +274 -0
- letta/server/static_files/assets/index-156816da.css +1 -0
- letta/server/static_files/assets/index-486e3228.js +274 -0
- letta/server/static_files/favicon.ico +0 -0
- letta/server/static_files/index.html +39 -0
- letta/server/static_files/memgpt_logo_transparent.png +0 -0
- letta/server/utils.py +46 -0
- letta/server/ws_api/__init__.py +0 -0
- letta/server/ws_api/example_client.py +104 -0
- letta/server/ws_api/interface.py +108 -0
- letta/server/ws_api/protocol.py +100 -0
- letta/server/ws_api/server.py +145 -0
- letta/settings.py +165 -0
- letta/streaming_interface.py +396 -0
- letta/system.py +207 -0
- letta/utils.py +1065 -0
- letta_nightly-0.1.7.dev20240924104148.dist-info/LICENSE +190 -0
- letta_nightly-0.1.7.dev20240924104148.dist-info/METADATA +98 -0
- letta_nightly-0.1.7.dev20240924104148.dist-info/RECORD +189 -0
- letta_nightly-0.1.7.dev20240924104148.dist-info/WHEEL +4 -0
- letta_nightly-0.1.7.dev20240924104148.dist-info/entry_points.txt +3 -0
|
@@ -0,0 +1,131 @@
|
|
|
1
|
+
import json
|
|
2
|
+
from typing import TYPE_CHECKING
|
|
3
|
+
|
|
4
|
+
from fastapi import APIRouter, Body, Depends, HTTPException
|
|
5
|
+
|
|
6
|
+
from letta.schemas.enums import MessageRole
|
|
7
|
+
from letta.schemas.letta_message import FunctionCall, LettaMessage
|
|
8
|
+
from letta.schemas.openai.chat_completion_request import ChatCompletionRequest
|
|
9
|
+
from letta.schemas.openai.chat_completion_response import (
|
|
10
|
+
ChatCompletionResponse,
|
|
11
|
+
Choice,
|
|
12
|
+
Message,
|
|
13
|
+
UsageStatistics,
|
|
14
|
+
)
|
|
15
|
+
|
|
16
|
+
# TODO this belongs in a controller!
|
|
17
|
+
from letta.server.rest_api.routers.v1.agents import send_message_to_agent
|
|
18
|
+
from letta.server.rest_api.utils import get_letta_server
|
|
19
|
+
|
|
20
|
+
if TYPE_CHECKING:
|
|
21
|
+
pass
|
|
22
|
+
|
|
23
|
+
from letta.server.server import SyncServer
|
|
24
|
+
from letta.utils import get_utc_time
|
|
25
|
+
|
|
26
|
+
# Router exposing an OpenAI-compatible chat-completions proxy in front of Letta agents.
router = APIRouter(prefix="/v1/chat/completions", tags=["chat_completions"])
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
@router.post("/", response_model=ChatCompletionResponse)
async def create_chat_completion(
    completion_request: ChatCompletionRequest = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """Send a message to a Letta agent via a /chat/completions completion_request

    The bearer token will be used to identify the user.
    The 'user' field in the completion_request should be set to the agent ID.

    Raises:
        HTTPException(400): if 'user' (agent ID) is missing, or 'messages' is
            missing/empty, longer than one entry, or not a user-role message.
    """
    actor = server.get_current_user()
    agent_id = completion_request.user
    if agent_id is None:
        raise HTTPException(status_code=400, detail="Must pass agent_id in the 'user' field")

    messages = completion_request.messages
    # NOTE: `not messages` also rejects an empty list, which previously slipped past the
    # None / len > 1 checks and crashed with an IndexError (HTTP 500) on messages[0].
    if not messages:
        raise HTTPException(status_code=400, detail="'messages' field must not be empty")
    if len(messages) > 1:
        raise HTTPException(status_code=400, detail="'messages' field must be a list of length 1")
    if messages[0].role != "user":
        raise HTTPException(status_code=400, detail="'messages[0].role' must be a 'user'")

    input_message = completion_request.messages[0]
    if completion_request.stream:
        print("Starting streaming OpenAI proxy response")

        # TODO(charles) support multimodal parts
        assert isinstance(input_message.content, str)

        return await send_message_to_agent(
            server=server,
            agent_id=agent_id,
            user_id=actor.id,
            role=MessageRole(input_message.role),
            message=input_message.content,
            # Turn streaming ON
            stream_steps=True,
            stream_tokens=True,
            # Turn on ChatCompletion mode (eg remaps send_message to content)
            chat_completion_mode=True,
            return_message_object=False,
        )

    else:
        print("Starting non-streaming OpenAI proxy response")

        # TODO(charles) support multimodal parts
        assert isinstance(input_message.content, str)

        response_messages = await send_message_to_agent(
            server=server,
            agent_id=agent_id,
            user_id=actor.id,
            role=MessageRole(input_message.role),
            message=input_message.content,
            # Turn streaming OFF
            stream_steps=False,
            stream_tokens=False,
            return_message_object=False,
        )

        # Concatenate all send_message outputs together into one assistant message.
        # (renamed from `id`, which shadowed the builtin)
        response_id = ""
        visible_message_str = ""
        created_at = None
        for letta_msg in response_messages.messages:
            assert isinstance(letta_msg, LettaMessage)
            if isinstance(letta_msg, FunctionCall):
                if letta_msg.name and letta_msg.name == "send_message":
                    # Narrowed from a bare `except:` so that e.g. KeyboardInterrupt propagates.
                    try:
                        letta_function_call_args = json.loads(letta_msg.arguments)
                        visible_message_str += letta_function_call_args["message"]
                        response_id = letta_msg.id
                        created_at = letta_msg.date
                    except (json.JSONDecodeError, KeyError, TypeError):
                        print(f"Failed to parse Letta message: {str(letta_msg)}")
                else:
                    print(f"Skipping function_call: {str(letta_msg)}")
            else:
                print(f"Skipping message: {str(letta_msg)}")

        response = ChatCompletionResponse(
            id=response_id,
            created=created_at if created_at else get_utc_time(),
            choices=[
                Choice(
                    finish_reason="stop",
                    index=0,
                    message=Message(
                        role="assistant",
                        content=visible_message_str,
                    ),
                )
            ],
            # TODO add real usage
            usage=UsageStatistics(
                completion_tokens=0,
                prompt_tokens=0,
                total_tokens=0,
            ),
        )
        return response
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
from letta.server.rest_api.routers.v1.agents import router as agents_router
|
|
2
|
+
from letta.server.rest_api.routers.v1.blocks import router as blocks_router
|
|
3
|
+
from letta.server.rest_api.routers.v1.jobs import router as jobs_router
|
|
4
|
+
from letta.server.rest_api.routers.v1.llms import router as llm_router
|
|
5
|
+
from letta.server.rest_api.routers.v1.sources import router as sources_router
|
|
6
|
+
from letta.server.rest_api.routers.v1.tools import router as tools_router
|
|
7
|
+
|
|
8
|
+
# Routers registered onto the FastAPI app; list order is the order routes are mounted.
ROUTERS = [
    tools_router,
    sources_router,
    agents_router,
    llm_router,
    blocks_router,
    jobs_router,
]
|
|
@@ -0,0 +1,543 @@
|
|
|
1
|
+
import asyncio
|
|
2
|
+
from datetime import datetime
|
|
3
|
+
from typing import Dict, List, Optional, Union
|
|
4
|
+
|
|
5
|
+
from fastapi import APIRouter, Body, Depends, HTTPException, Query, status
|
|
6
|
+
from fastapi.responses import JSONResponse, StreamingResponse
|
|
7
|
+
from starlette.responses import StreamingResponse
|
|
8
|
+
|
|
9
|
+
from letta.schemas.agent import AgentState, CreateAgent, UpdateAgentState
|
|
10
|
+
from letta.schemas.enums import MessageRole, MessageStreamStatus
|
|
11
|
+
from letta.schemas.letta_message import (
|
|
12
|
+
LegacyLettaMessage,
|
|
13
|
+
LettaMessage,
|
|
14
|
+
LettaMessageUnion,
|
|
15
|
+
)
|
|
16
|
+
from letta.schemas.letta_request import LettaRequest
|
|
17
|
+
from letta.schemas.letta_response import LettaResponse
|
|
18
|
+
from letta.schemas.memory import (
|
|
19
|
+
ArchivalMemorySummary,
|
|
20
|
+
BasicBlockMemory,
|
|
21
|
+
CreateArchivalMemory,
|
|
22
|
+
Memory,
|
|
23
|
+
RecallMemorySummary,
|
|
24
|
+
)
|
|
25
|
+
from letta.schemas.message import Message, UpdateMessage
|
|
26
|
+
from letta.schemas.passage import Passage
|
|
27
|
+
from letta.schemas.source import Source
|
|
28
|
+
from letta.server.rest_api.interface import StreamingServerInterface
|
|
29
|
+
from letta.server.rest_api.utils import get_letta_server, sse_async_generator
|
|
30
|
+
from letta.server.server import SyncServer
|
|
31
|
+
from letta.utils import deduplicate
|
|
32
|
+
|
|
33
|
+
# These can be forward refs, but because Fastapi needs them at runtime the must be imported normally
|
|
34
|
+
|
|
35
|
+
|
|
36
|
+
# Router for all /agents endpoints (CRUD, memory, archival, and messaging).
router = APIRouter(prefix="/agents", tags=["agents"])
|
|
37
|
+
|
|
38
|
+
|
|
39
|
+
@router.get("/", response_model=List[AgentState], operation_id="list_agents")
def list_agents(
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    List all agents associated with a given user.

    Returns every agent (and its configuration) owned by the authenticated user.
    """
    current_user = server.get_current_user()
    return server.list_agents(user_id=current_user.id)
|
|
50
|
+
|
|
51
|
+
|
|
52
|
+
@router.post("/", response_model=AgentState, operation_id="create_agent")
def create_agent(
    agent: CreateAgent = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Create a new agent with the specified configuration.

    Raises:
        HTTPException(400): if the request does not include a memory configuration.
    """
    actor = server.get_current_user()
    agent.user_id = actor.id
    # TODO: sarah make general
    # TODO: eventually remove this
    # `assert` is stripped under `python -O` and surfaces as a 500; reject bad input explicitly.
    if agent.memory is None:  # TODO: dont force this, can be None (use default human/persona)
        raise HTTPException(status_code=400, detail="'memory' must be provided when creating an agent")
    blocks = agent.memory.get_blocks()
    agent.memory = BasicBlockMemory(blocks=blocks)

    return server.create_agent(agent, user_id=actor.id)
|
|
69
|
+
|
|
70
|
+
|
|
71
|
+
@router.patch("/{agent_id}", response_model=AgentState, operation_id="update_agent")
def update_agent(
    agent_id: str,
    update_agent: UpdateAgentState = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """Update an existing agent."""
    current_user = server.get_current_user()

    # Bind the path parameter onto the update payload before dispatching to the server.
    update_agent.id = agent_id
    return server.update_agent(update_agent, user_id=current_user.id)
|
|
82
|
+
|
|
83
|
+
|
|
84
|
+
@router.get("/{agent_id}", response_model=AgentState, operation_id="get_agent")
def get_agent_state(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Get the state of the agent.
    """
    current_user = server.get_current_user()

    # 404 when the agent is missing or not visible to this user.
    agent_record = server.ms.get_agent(user_id=current_user.id, agent_id=agent_id)
    if not agent_record:
        raise HTTPException(status_code=404, detail=f"Agent agent_id={agent_id} not found.")

    return server.get_agent_state(user_id=current_user.id, agent_id=agent_id)
|
|
99
|
+
|
|
100
|
+
|
|
101
|
+
@router.delete("/{agent_id}", response_model=None, operation_id="delete_agent")
def delete_agent(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Delete an agent.
    """
    current_user = server.get_current_user()
    return server.delete_agent(user_id=current_user.id, agent_id=agent_id)
|
|
112
|
+
|
|
113
|
+
|
|
114
|
+
@router.get("/{agent_id}/sources", response_model=List[Source], operation_id="get_agent_sources")
def get_agent_sources(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Get the sources associated with an agent.
    """
    # Called for its auth side effect only; the lookup below is not user-scoped.
    server.get_current_user()
    return server.list_attached_sources(agent_id)
|
|
125
|
+
|
|
126
|
+
|
|
127
|
+
@router.get("/{agent_id}/memory/messages", response_model=List[Message], operation_id="list_agent_in_context_messages")
def get_agent_in_context_messages(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Retrieve the messages in the context of a specific agent.
    """
    return server.get_in_context_messages(agent_id=agent_id)
|
|
137
|
+
|
|
138
|
+
|
|
139
|
+
@router.get("/{agent_id}/memory", response_model=Memory, operation_id="get_agent_memory")
def get_agent_memory(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Retrieve the memory state of a specific agent.

    Fetches the current memory state of the agent identified by the agent ID.
    """
    return server.get_agent_memory(agent_id=agent_id)
|
|
150
|
+
|
|
151
|
+
|
|
152
|
+
@router.patch("/{agent_id}/memory", response_model=Memory, operation_id="update_agent_memory")
def update_agent_memory(
    agent_id: str,
    request: Dict = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Update the core memory of a specific agent.

    Accepts new memory contents (human and persona) and applies them to the
    core memory of the agent identified by the user ID and agent ID.
    """
    current_user = server.get_current_user()

    return server.update_agent_core_memory(user_id=current_user.id, agent_id=agent_id, new_memory_contents=request)
|
|
166
|
+
|
|
167
|
+
|
|
168
|
+
@router.get("/{agent_id}/memory/recall", response_model=RecallMemorySummary, operation_id="get_agent_recall_memory_summary")
def get_agent_recall_memory_summary(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Retrieve the summary of the recall memory of a specific agent.
    """
    return server.get_recall_memory_summary(agent_id=agent_id)
|
|
178
|
+
|
|
179
|
+
|
|
180
|
+
@router.get("/{agent_id}/memory/archival", response_model=ArchivalMemorySummary, operation_id="get_agent_archival_memory_summary")
def get_agent_archival_memory_summary(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Retrieve the summary of the archival memory of a specific agent.
    """
    return server.get_archival_memory_summary(agent_id=agent_id)
|
|
190
|
+
|
|
191
|
+
|
|
192
|
+
@router.get("/{agent_id}/archival", response_model=List[Passage], operation_id="list_agent_archival_memory")
def get_agent_archival_memory(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
    after: Optional[int] = Query(None, description="Unique ID of the memory to start the query range at."),
    before: Optional[int] = Query(None, description="Unique ID of the memory to end the query range at."),
    limit: Optional[int] = Query(None, description="How many results to include in the response."),
):
    """
    Retrieve the memories in an agent's archival memory store (paginated query).
    """
    current_user = server.get_current_user()

    # TODO need to add support for non-postgres here
    # chroma will throw:
    # raise ValueError("Cannot run get_all_cursor with chroma")
    return server.get_agent_archival_cursor(
        user_id=current_user.id,
        agent_id=agent_id,
        after=after,
        before=before,
        limit=limit,
    )
|
|
216
|
+
|
|
217
|
+
|
|
218
|
+
@router.post("/{agent_id}/archival", response_model=List[Passage], operation_id="create_agent_archival_memory")
def insert_agent_archival_memory(
    agent_id: str,
    request: CreateArchivalMemory = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Insert a memory into an agent's archival memory store.
    """
    current_user = server.get_current_user()

    return server.insert_archival_memory(user_id=current_user.id, agent_id=agent_id, memory_contents=request.text)
|
|
230
|
+
|
|
231
|
+
|
|
232
|
+
# TODO(ethan): query or path parameter for memory_id?
|
|
233
|
+
# @router.delete("/{agent_id}/archival")
|
|
234
|
+
@router.delete("/{agent_id}/archival/{memory_id}", response_model=None, operation_id="delete_agent_archival_memory")
def delete_agent_archival_memory(
    agent_id: str,
    memory_id: str,
    # memory_id: str = Query(..., description="Unique ID of the memory to be deleted."),
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Delete a memory from an agent's archival memory store.
    """
    current_user = server.get_current_user()

    server.delete_archival_memory(user_id=current_user.id, agent_id=agent_id, memory_id=memory_id)
    return JSONResponse(status_code=status.HTTP_200_OK, content={"message": f"Memory id={memory_id} successfully deleted"})
|
|
248
|
+
|
|
249
|
+
|
|
250
|
+
@router.get("/{agent_id}/messages", response_model=Union[List[Message], List[LettaMessageUnion]], operation_id="list_agent_messages")
def get_agent_messages(
    agent_id: str,
    server: "SyncServer" = Depends(get_letta_server),
    before: Optional[str] = Query(None, description="Message before which to retrieve the returned messages."),
    limit: int = Query(10, description="Maximum number of messages to retrieve."),
    msg_object: bool = Query(False, description="If true, returns Message objects. If false, return LettaMessage objects."),
):
    """
    Retrieve message history for an agent.
    """
    current_user = server.get_current_user()

    # Newest-first pagination over the agent's recall storage.
    return server.get_agent_recall_cursor(
        user_id=current_user.id,
        agent_id=agent_id,
        before=before,
        limit=limit,
        reverse=True,
        return_message_object=msg_object,
    )
|
|
271
|
+
|
|
272
|
+
|
|
273
|
+
@router.patch("/{agent_id}/messages/{message_id}", response_model=Message, operation_id="update_agent_message")
def update_message(
    agent_id: str,
    message_id: str,
    request: UpdateMessage = Body(...),
    server: "SyncServer" = Depends(get_letta_server),
):
    """
    Update the details of a message associated with an agent.

    Raises:
        HTTPException(400): if the path `message_id` does not match the ID in the request body.
    """
    # `assert` is stripped under `python -O` and surfaces as a 500; reject the mismatch explicitly.
    if request.id != message_id:
        raise HTTPException(status_code=400, detail=f"Message ID mismatch: {request.id} != {message_id}")
    return server.update_agent_message(agent_id=agent_id, request=request)
|
|
285
|
+
|
|
286
|
+
|
|
287
|
+
@router.post("/{agent_id}/messages", response_model=LettaResponse, operation_id="create_agent_message")
async def send_message(
    agent_id: str,
    server: SyncServer = Depends(get_letta_server),
    request: LettaRequest = Body(...),
):
    """
    Process a user message and return the agent's response.
    This endpoint accepts a message from a user and processes it through the agent.
    It can optionally stream the response if 'stream_steps' or 'stream_tokens' is set to True.

    Raises:
        HTTPException(400): if the request does not contain exactly one message.
    """
    actor = server.get_current_user()

    # TODO(charles): support sending multiple messages
    # `assert` is stripped under `python -O` and surfaces as a 500; validate explicitly.
    if len(request.messages) != 1:
        raise HTTPException(status_code=400, detail=f"Multiple messages not supported: {request.messages}")
    message = request.messages[0]

    return await send_message_to_agent(
        server=server,
        agent_id=agent_id,
        user_id=actor.id,
        role=message.role,
        message=message.text,
        stream_steps=request.stream_steps,
        stream_tokens=request.stream_tokens,
        return_message_object=request.return_message_object,
    )
|
|
314
|
+
|
|
315
|
+
|
|
316
|
+
# TODO: move this into server.py?
|
|
317
|
+
async def send_message_to_agent(
    server: SyncServer,
    agent_id: str,
    user_id: str,
    role: MessageRole,
    message: str,
    stream_steps: bool,
    stream_tokens: bool,
    return_message_object: bool,  # Should be True for Python Client, False for REST API
    chat_completion_mode: Optional[bool] = False,
    timestamp: Optional[datetime] = None,
    # related to whether or not we return `LettaMessage`s or `Message`s
) -> Union[StreamingResponse, LettaResponse]:
    """Split off into a separate function so that it can be imported in the /chat/completion proxy.

    Dispatches `message` to the agent (as a user or system message) on a worker
    thread while consuming the agent's streaming interface on the event loop.

    Returns:
        StreamingResponse: an SSE stream of `LettaMessage` chunks when
            `stream_steps` is True.
        LettaResponse: the fully buffered message list (plus usage) otherwise.

    Raises:
        HTTPException: 500 for an unsupported role or any internal failure,
            400 when `stream_tokens` is requested without `stream_steps`.
    """
    # TODO: @charles is this the correct way to handle?
    include_final_message = True

    # determine role: only user and system messages can be injected this way
    if role == MessageRole.user:
        message_func = server.user_message
    elif role == MessageRole.system:
        message_func = server.system_message
    else:
        raise HTTPException(status_code=500, detail=f"Bad role {role}")

    # Token streaming is a refinement of step streaming, so it cannot be used alone.
    if not stream_steps and stream_tokens:
        raise HTTPException(status_code=400, detail="stream_steps must be 'true' if stream_tokens is 'true'")

    # For streaming response
    try:

        # TODO: move this logic into server.py

        # Get the generator object off of the agent's streaming interface
        # This will be attached to the POST SSE request used under-the-hood
        letta_agent = server._get_or_load_agent(agent_id=agent_id)
        streaming_interface = letta_agent.interface
        if not isinstance(streaming_interface, StreamingServerInterface):
            raise ValueError(f"Agent has wrong type of interface: {type(streaming_interface)}")

        # Disable token streaming if not OpenAI
        # TODO: cleanup this logic
        if server.server_llm_config.model_endpoint_type != "openai" or "inference.memgpt.ai" in server.server_llm_config.model_endpoint:
            print("Warning: token streaming is only supported for OpenAI models. Setting to False.")
            stream_tokens = False

        # Enable token-streaming within the request if desired
        streaming_interface.streaming_mode = stream_tokens
        # "chatcompletion mode" does some remapping and ignores inner thoughts
        streaming_interface.streaming_chat_completion_mode = chat_completion_mode

        # streaming_interface.allow_assistant_message = stream
        # streaming_interface.function_call_legacy_mode = stream

        # Offload the synchronous message_func to a separate thread so the event
        # loop stays free to drain the interface's generator concurrently.
        # NOTE(review): stream_start() is called before the task is created —
        # presumably required so no chunks are dropped; confirm before reordering.
        streaming_interface.stream_start()
        task = asyncio.create_task(
            asyncio.to_thread(message_func, user_id=user_id, agent_id=agent_id, message=message, timestamp=timestamp)
        )

        if stream_steps:
            if return_message_object:
                # TODO implement returning `Message`s in a stream, not just `LettaMessage` format
                raise NotImplementedError

            # return a stream (the background task keeps feeding the generator)
            return StreamingResponse(
                sse_async_generator(streaming_interface.get_generator(), finish_message=include_final_message),
                media_type="text/event-stream",
            )

        else:
            # buffer the stream, then return the list
            generated_stream = []
            async for message in streaming_interface.get_generator():
                assert (
                    isinstance(message, LettaMessage) or isinstance(message, LegacyLettaMessage) or isinstance(message, MessageStreamStatus)
                ), type(message)
                generated_stream.append(message)
                # stop consuming once the interface signals completion
                if message == MessageStreamStatus.done:
                    break

            # Get rid of the stream status messages
            filtered_stream = [d for d in generated_stream if not isinstance(d, MessageStreamStatus)]
            # join the worker thread; its return value carries the usage statistics
            usage = await task

            # By default the stream will be messages of type LettaMessage or LettaLegacyMessage
            # If we want to convert these to Message, we can use the attached IDs
            # NOTE: we will need to de-duplicate the Messsage IDs though (since Assistant->Inner+Func_Call)
            # TODO: eventually update the interface to use `Message` and `MessageChunk` (new) inside the deque instead
            if return_message_object:
                message_ids = [m.id for m in filtered_stream]
                message_ids = deduplicate(message_ids)
                message_objs = [server.get_agent_message(agent_id=agent_id, message_id=m_id) for m_id in message_ids]
                return LettaResponse(messages=message_objs, usage=usage)
            else:
                return LettaResponse(messages=filtered_stream, usage=usage)

    except HTTPException:
        # re-raise intentional HTTP errors untouched
        raise
    except Exception as e:
        # anything else becomes a 500 with the original error text attached
        print(e)
        import traceback

        traceback.print_exc()
        raise HTTPException(status_code=500, detail=f"{e}")
|
|
423
|
+
|
|
424
|
+
|
|
425
|
+
##### MISSING #######
|
|
426
|
+
|
|
427
|
+
# @router.post("/{agent_id}/command")
|
|
428
|
+
# def run_command(
|
|
429
|
+
# agent_id: "UUID",
|
|
430
|
+
# command: "AgentCommandRequest",
|
|
431
|
+
#
|
|
432
|
+
# server: "SyncServer" = Depends(get_letta_server),
|
|
433
|
+
# ):
|
|
434
|
+
# """
|
|
435
|
+
# Execute a command on a specified agent.
|
|
436
|
+
|
|
437
|
+
# This endpoint receives a command to be executed on an agent. It uses the user and agent identifiers to authenticate and route the command appropriately.
|
|
438
|
+
|
|
439
|
+
# Raises an HTTPException for any processing errors.
|
|
440
|
+
# """
|
|
441
|
+
# actor = server.get_current_user()
|
|
442
|
+
#
|
|
443
|
+
# response = server.run_command(user_id=actor.id,
|
|
444
|
+
# agent_id=agent_id,
|
|
445
|
+
# command=command.command)
|
|
446
|
+
|
|
447
|
+
# return AgentCommandResponse(response=response)
|
|
448
|
+
|
|
449
|
+
# @router.get("/{agent_id}/config")
|
|
450
|
+
# def get_agent_config(
|
|
451
|
+
# agent_id: "UUID",
|
|
452
|
+
#
|
|
453
|
+
# server: "SyncServer" = Depends(get_letta_server),
|
|
454
|
+
# ):
|
|
455
|
+
# """
|
|
456
|
+
# Retrieve the configuration for a specific agent.
|
|
457
|
+
|
|
458
|
+
# This endpoint fetches the configuration details for a given agent, identified by the user and agent IDs.
|
|
459
|
+
# """
|
|
460
|
+
# actor = server.get_current_user()
|
|
461
|
+
#
|
|
462
|
+
# if not server.ms.get_agent(user_id=actor.id, agent_id=agent_id):
|
|
463
|
+
## agent does not exist
|
|
464
|
+
# raise HTTPException(status_code=404, detail=f"Agent agent_id={agent_id} not found.")
|
|
465
|
+
|
|
466
|
+
# agent_state = server.get_agent_config(user_id=actor.id, agent_id=agent_id)
|
|
467
|
+
## get sources
|
|
468
|
+
# attached_sources = server.list_attached_sources(agent_id=agent_id)
|
|
469
|
+
|
|
470
|
+
## configs
|
|
471
|
+
# llm_config = LLMConfig(**vars(agent_state.llm_config))
|
|
472
|
+
# embedding_config = EmbeddingConfig(**vars(agent_state.embedding_config))
|
|
473
|
+
|
|
474
|
+
# return GetAgentResponse(
|
|
475
|
+
# agent_state=AgentState(
|
|
476
|
+
# id=agent_state.id,
|
|
477
|
+
# name=agent_state.name,
|
|
478
|
+
# user_id=agent_state.user_id,
|
|
479
|
+
# llm_config=llm_config,
|
|
480
|
+
# embedding_config=embedding_config,
|
|
481
|
+
# state=agent_state.state,
|
|
482
|
+
# created_at=int(agent_state.created_at.timestamp()),
|
|
483
|
+
# tools=agent_state.tools,
|
|
484
|
+
# system=agent_state.system,
|
|
485
|
+
# metadata=agent_state._metadata,
|
|
486
|
+
# ),
|
|
487
|
+
# last_run_at=None, # TODO
|
|
488
|
+
# sources=attached_sources,
|
|
489
|
+
# )
|
|
490
|
+
|
|
491
|
+
# @router.patch("/{agent_id}/rename", response_model=GetAgentResponse)
|
|
492
|
+
# def update_agent_name(
|
|
493
|
+
# agent_id: "UUID",
|
|
494
|
+
# agent_rename: AgentRenameRequest,
|
|
495
|
+
#
|
|
496
|
+
# server: "SyncServer" = Depends(get_letta_server),
|
|
497
|
+
# ):
|
|
498
|
+
# """
|
|
499
|
+
# Updates the name of a specific agent.
|
|
500
|
+
|
|
501
|
+
# This changes the name of the agent in the database but does NOT edit the agent's persona.
|
|
502
|
+
# """
|
|
503
|
+
# valid_name = agent_rename.agent_name
|
|
504
|
+
# actor = server.get_current_user()
|
|
505
|
+
#
|
|
506
|
+
# agent_state = server.rename_agent(user_id=actor.id, agent_id=agent_id, new_agent_name=valid_name)
|
|
507
|
+
## get sources
|
|
508
|
+
# attached_sources = server.list_attached_sources(agent_id=agent_id)
|
|
509
|
+
# llm_config = LLMConfig(**vars(agent_state.llm_config))
|
|
510
|
+
# embedding_config = EmbeddingConfig(**vars(agent_state.embedding_config))
|
|
511
|
+
|
|
512
|
+
# return GetAgentResponse(
|
|
513
|
+
# agent_state=AgentState(
|
|
514
|
+
# id=agent_state.id,
|
|
515
|
+
# name=agent_state.name,
|
|
516
|
+
# user_id=agent_state.user_id,
|
|
517
|
+
# llm_config=llm_config,
|
|
518
|
+
# embedding_config=embedding_config,
|
|
519
|
+
# state=agent_state.state,
|
|
520
|
+
# created_at=int(agent_state.created_at.timestamp()),
|
|
521
|
+
# tools=agent_state.tools,
|
|
522
|
+
# system=agent_state.system,
|
|
523
|
+
# ),
|
|
524
|
+
# last_run_at=None, # TODO
|
|
525
|
+
# sources=attached_sources,
|
|
526
|
+
# )
|
|
527
|
+
|
|
528
|
+
|
|
529
|
+
# @router.get("/{agent_id}/archival/all", response_model=GetAgentArchivalMemoryResponse)
|
|
530
|
+
# def get_agent_archival_memory_all(
|
|
531
|
+
# agent_id: "UUID",
|
|
532
|
+
#
|
|
533
|
+
# server: "SyncServer" = Depends(get_letta_server),
|
|
534
|
+
# ):
|
|
535
|
+
# """
|
|
536
|
+
# Retrieve the memories in an agent's archival memory store (non-paginated, returns all entries at once).
|
|
537
|
+
# """
|
|
538
|
+
# actor = server.get_current_user()
|
|
539
|
+
#
|
|
540
|
+
# archival_memories = server.get_all_archival_memories(user_id=actor.id, agent_id=agent_id)
|
|
541
|
+
# print("archival_memories:", archival_memories)
|
|
542
|
+
# archival_memory_objects = [ArchivalMemoryObject(id=passage["id"], contents=passage["contents"]) for passage in archival_memories]
|
|
543
|
+
# return GetAgentArchivalMemoryResponse(archival_memory=archival_memory_objects)
|