PyPI - letta-nightly - Versions diffs - 0.1.7.dev20240924104148__py3-none-any.whl - Mend

letta-nightly 0.1.7.dev20240924104148__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of letta-nightly might be problematic. Click here for more details.

Files changed (189) hide show

letta/__init__.py +24 -0
letta/__main__.py +3 -0
letta/agent.py +1427 -0
letta/agent_store/chroma.py +295 -0
letta/agent_store/db.py +546 -0
letta/agent_store/lancedb.py +177 -0
letta/agent_store/milvus.py +198 -0
letta/agent_store/qdrant.py +201 -0
letta/agent_store/storage.py +188 -0
letta/benchmark/benchmark.py +96 -0
letta/benchmark/constants.py +14 -0
letta/cli/cli.py +689 -0
letta/cli/cli_config.py +1282 -0
letta/cli/cli_load.py +166 -0
letta/client/__init__.py +0 -0
letta/client/admin.py +171 -0
letta/client/client.py +2360 -0
letta/client/streaming.py +90 -0
letta/client/utils.py +61 -0
letta/config.py +484 -0
letta/configs/anthropic.json +13 -0
letta/configs/letta_hosted.json +11 -0
letta/configs/openai.json +12 -0
letta/constants.py +134 -0
letta/credentials.py +140 -0
letta/data_sources/connectors.py +247 -0
letta/embeddings.py +218 -0
letta/errors.py +26 -0
letta/functions/__init__.py +0 -0
letta/functions/function_sets/base.py +174 -0
letta/functions/function_sets/extras.py +132 -0
letta/functions/functions.py +105 -0
letta/functions/schema_generator.py +205 -0
letta/humans/__init__.py +0 -0
letta/humans/examples/basic.txt +1 -0
letta/humans/examples/cs_phd.txt +9 -0
letta/interface.py +314 -0
letta/llm_api/__init__.py +0 -0
letta/llm_api/anthropic.py +383 -0
letta/llm_api/azure_openai.py +155 -0
letta/llm_api/cohere.py +396 -0
letta/llm_api/google_ai.py +468 -0
letta/llm_api/llm_api_tools.py +485 -0
letta/llm_api/openai.py +470 -0
letta/local_llm/README.md +3 -0
letta/local_llm/__init__.py +0 -0
letta/local_llm/chat_completion_proxy.py +279 -0
letta/local_llm/constants.py +31 -0
letta/local_llm/function_parser.py +68 -0
letta/local_llm/grammars/__init__.py +0 -0
letta/local_llm/grammars/gbnf_grammar_generator.py +1324 -0
letta/local_llm/grammars/json.gbnf +26 -0
letta/local_llm/grammars/json_func_calls_with_inner_thoughts.gbnf +32 -0
letta/local_llm/groq/api.py +97 -0
letta/local_llm/json_parser.py +202 -0
letta/local_llm/koboldcpp/api.py +62 -0
letta/local_llm/koboldcpp/settings.py +23 -0
letta/local_llm/llamacpp/api.py +58 -0
letta/local_llm/llamacpp/settings.py +22 -0
letta/local_llm/llm_chat_completion_wrappers/__init__.py +0 -0
letta/local_llm/llm_chat_completion_wrappers/airoboros.py +452 -0
letta/local_llm/llm_chat_completion_wrappers/chatml.py +470 -0
letta/local_llm/llm_chat_completion_wrappers/configurable_wrapper.py +387 -0
letta/local_llm/llm_chat_completion_wrappers/dolphin.py +246 -0
letta/local_llm/llm_chat_completion_wrappers/llama3.py +345 -0
letta/local_llm/llm_chat_completion_wrappers/simple_summary_wrapper.py +156 -0
letta/local_llm/llm_chat_completion_wrappers/wrapper_base.py +11 -0
letta/local_llm/llm_chat_completion_wrappers/zephyr.py +345 -0
letta/local_llm/lmstudio/api.py +100 -0
letta/local_llm/lmstudio/settings.py +29 -0
letta/local_llm/ollama/api.py +88 -0
letta/local_llm/ollama/settings.py +32 -0
letta/local_llm/settings/__init__.py +0 -0
letta/local_llm/settings/deterministic_mirostat.py +45 -0
letta/local_llm/settings/settings.py +72 -0
letta/local_llm/settings/simple.py +28 -0
letta/local_llm/utils.py +265 -0
letta/local_llm/vllm/api.py +63 -0
letta/local_llm/webui/api.py +60 -0
letta/local_llm/webui/legacy_api.py +58 -0
letta/local_llm/webui/legacy_settings.py +23 -0
letta/local_llm/webui/settings.py +24 -0
letta/log.py +76 -0
letta/main.py +437 -0
letta/memory.py +440 -0
letta/metadata.py +884 -0
letta/openai_backcompat/__init__.py +0 -0
letta/openai_backcompat/openai_object.py +437 -0
letta/persistence_manager.py +148 -0
letta/personas/__init__.py +0 -0
letta/personas/examples/anna_pa.txt +13 -0
letta/personas/examples/google_search_persona.txt +15 -0
letta/personas/examples/memgpt_doc.txt +6 -0
letta/personas/examples/memgpt_starter.txt +4 -0
letta/personas/examples/sam.txt +14 -0
letta/personas/examples/sam_pov.txt +14 -0
letta/personas/examples/sam_simple_pov_gpt35.txt +13 -0
letta/personas/examples/sqldb/test.db +0 -0
letta/prompts/__init__.py +0 -0
letta/prompts/gpt_summarize.py +14 -0
letta/prompts/gpt_system.py +26 -0
letta/prompts/system/memgpt_base.txt +49 -0
letta/prompts/system/memgpt_chat.txt +58 -0
letta/prompts/system/memgpt_chat_compressed.txt +13 -0
letta/prompts/system/memgpt_chat_fstring.txt +51 -0
letta/prompts/system/memgpt_doc.txt +50 -0
letta/prompts/system/memgpt_gpt35_extralong.txt +53 -0
letta/prompts/system/memgpt_intuitive_knowledge.txt +31 -0
letta/prompts/system/memgpt_modified_chat.txt +23 -0
letta/pytest.ini +0 -0
letta/schemas/agent.py +117 -0
letta/schemas/api_key.py +21 -0
letta/schemas/block.py +135 -0
letta/schemas/document.py +21 -0
letta/schemas/embedding_config.py +54 -0
letta/schemas/enums.py +35 -0
letta/schemas/job.py +38 -0
letta/schemas/letta_base.py +80 -0
letta/schemas/letta_message.py +175 -0
letta/schemas/letta_request.py +23 -0
letta/schemas/letta_response.py +28 -0
letta/schemas/llm_config.py +54 -0
letta/schemas/memory.py +224 -0
letta/schemas/message.py +727 -0
letta/schemas/openai/chat_completion_request.py +123 -0
letta/schemas/openai/chat_completion_response.py +136 -0
letta/schemas/openai/chat_completions.py +123 -0
letta/schemas/openai/embedding_response.py +11 -0
letta/schemas/openai/openai.py +157 -0
letta/schemas/organization.py +20 -0
letta/schemas/passage.py +80 -0
letta/schemas/source.py +62 -0
letta/schemas/tool.py +143 -0
letta/schemas/usage.py +18 -0
letta/schemas/user.py +33 -0
letta/server/__init__.py +0 -0
letta/server/constants.py +6 -0
letta/server/rest_api/__init__.py +0 -0
letta/server/rest_api/admin/__init__.py +0 -0
letta/server/rest_api/admin/agents.py +21 -0
letta/server/rest_api/admin/tools.py +83 -0
letta/server/rest_api/admin/users.py +98 -0
letta/server/rest_api/app.py +193 -0
letta/server/rest_api/auth/__init__.py +0 -0
letta/server/rest_api/auth/index.py +43 -0
letta/server/rest_api/auth_token.py +22 -0
letta/server/rest_api/interface.py +726 -0
letta/server/rest_api/routers/__init__.py +0 -0
letta/server/rest_api/routers/openai/__init__.py +0 -0
letta/server/rest_api/routers/openai/assistants/__init__.py +0 -0
letta/server/rest_api/routers/openai/assistants/assistants.py +115 -0
letta/server/rest_api/routers/openai/assistants/schemas.py +121 -0
letta/server/rest_api/routers/openai/assistants/threads.py +336 -0
letta/server/rest_api/routers/openai/chat_completions/__init__.py +0 -0
letta/server/rest_api/routers/openai/chat_completions/chat_completions.py +131 -0
letta/server/rest_api/routers/v1/__init__.py +15 -0
letta/server/rest_api/routers/v1/agents.py +543 -0
letta/server/rest_api/routers/v1/blocks.py +73 -0
letta/server/rest_api/routers/v1/jobs.py +46 -0
letta/server/rest_api/routers/v1/llms.py +28 -0
letta/server/rest_api/routers/v1/organizations.py +61 -0
letta/server/rest_api/routers/v1/sources.py +199 -0
letta/server/rest_api/routers/v1/tools.py +103 -0
letta/server/rest_api/routers/v1/users.py +109 -0
letta/server/rest_api/static_files.py +74 -0
letta/server/rest_api/utils.py +69 -0
letta/server/server.py +1995 -0
letta/server/startup.sh +8 -0
letta/server/static_files/assets/index-0cbf7ad5.js +274 -0
letta/server/static_files/assets/index-156816da.css +1 -0
letta/server/static_files/assets/index-486e3228.js +274 -0
letta/server/static_files/favicon.ico +0 -0
letta/server/static_files/index.html +39 -0
letta/server/static_files/memgpt_logo_transparent.png +0 -0
letta/server/utils.py +46 -0
letta/server/ws_api/__init__.py +0 -0
letta/server/ws_api/example_client.py +104 -0
letta/server/ws_api/interface.py +108 -0
letta/server/ws_api/protocol.py +100 -0
letta/server/ws_api/server.py +145 -0
letta/settings.py +165 -0
letta/streaming_interface.py +396 -0
letta/system.py +207 -0
letta/utils.py +1065 -0
letta_nightly-0.1.7.dev20240924104148.dist-info/LICENSE +190 -0
letta_nightly-0.1.7.dev20240924104148.dist-info/METADATA +98 -0
letta_nightly-0.1.7.dev20240924104148.dist-info/RECORD +189 -0
letta_nightly-0.1.7.dev20240924104148.dist-info/WHEEL +4 -0
letta_nightly-0.1.7.dev20240924104148.dist-info/entry_points.txt +3 -0

letta/memory.py ADDED Viewed

@@ -0,0 +1,440 @@
+import datetime
+from abc import ABC, abstractmethod
+from typing import Callable, Dict, List, Tuple, Union
+from letta.constants import MESSAGE_SUMMARY_REQUEST_ACK, MESSAGE_SUMMARY_WARNING_FRAC
+from letta.embeddings import embedding_model, parse_and_chunk_text, query_embedding
+from letta.llm_api.llm_api_tools import create
+from letta.prompts.gpt_summarize import SYSTEM as SUMMARY_PROMPT_SYSTEM
+from letta.schemas.agent import AgentState
+from letta.schemas.memory import Memory
+from letta.schemas.message import Message
+from letta.schemas.passage import Passage
+from letta.utils import (
+    count_tokens,
+    extract_date_from_timestamp,
+    get_local_time,
+    printd,
+    validate_date_format,
+)
+def get_memory_functions(cls: Memory) -> Dict[str, Callable]:
+    """Collect the public callables that `cls` exposes beyond the base `Memory` class
+    :param cls: Memory class whose attributes are inspected via dir()
+    :type cls: Memory
+    :return: Mapping of attribute name to the callable found under that name
+    """
+    # names of every callable attribute on the base class; these are never returned
+    inherited = [name for name in dir(Memory) if callable(getattr(Memory, name))]
+    collected = {}
+    for name in dir(cls):
+        # underscore-prefixed names, "load" and "to_dict" are skipped by name alone
+        if name.startswith("_") or name in ["load", "to_dict"]:
+            continue
+        # anything the base class already provides is skipped as well
+        if name in inherited:
+            continue
+        candidate = getattr(cls, name)
+        if callable(candidate):  # plain data attributes are ignored
+            collected[name] = candidate
+    return collected
+def _format_summary_history(message_history: List[Message]):
+    """Render each message as a "role: text" line and join the lines with newlines"""
+    # TODO use existing prompt formatters for this (eg ChatML)
+    rendered = []
+    for msg in message_history:
+        rendered.append(f"{msg.role}: {msg.text}")
+    return "\n".join(rendered)
+def summarize_messages(
+    agent_state: AgentState,
+    message_sequence_to_summarize: List[Message],
+    insert_acknowledgement_assistant_message: bool = True,
+):
+    """Ask the agent's LLM to summarize a sequence of messages
+    :param agent_state: Supplies llm_config (including context_window), user_id and id for the request
+    :type agent_state: AgentState
+    :param message_sequence_to_summarize: Messages to condense
+    :type message_sequence_to_summarize: List[Message]
+    :param insert_acknowledgement_assistant_message: If True, an assistant message holding
+        MESSAGE_SUMMARY_REQUEST_ACK is placed between the system prompt and the user input
+    :type insert_acknowledgement_assistant_message: bool
+    :return: Message content of the first choice in the LLM response
+    """
+    llm_config = agent_state.llm_config
+    # the formatted history may use at most this many tokens before it gets pre-condensed
+    token_budget = MESSAGE_SUMMARY_WARNING_FRAC * llm_config.context_window
+    summary_input = _format_summary_history(message_sequence_to_summarize)
+    input_token_count = count_tokens(summary_input)
+    if input_token_count > token_budget:
+        # too long: summarize a leading slice recursively, keep the tail as-is
+        trunc_ratio = (token_budget / input_token_count) * 0.8  # For good measure...
+        cutoff = int(len(message_sequence_to_summarize) * trunc_ratio)
+        head_summary = summarize_messages(agent_state, message_sequence_to_summarize=message_sequence_to_summarize[:cutoff])
+        # NOTE(review): the tail is embedded through str() of a list of Message objects rather than
+        # through _format_summary_history, and the recursive call does not forward
+        # insert_acknowledgement_assistant_message -- confirm both are intended
+        summary_input = str([head_summary] + message_sequence_to_summarize[cutoff:])
+    # the request messages are attributed to the agent's own user/agent ids
+    owner = {"user_id": agent_state.user_id, "agent_id": agent_state.id}
+    message_sequence = [Message(role="system", text=SUMMARY_PROMPT_SYSTEM, **owner)]
+    if insert_acknowledgement_assistant_message:
+        message_sequence.append(Message(role="assistant", text=MESSAGE_SUMMARY_REQUEST_ACK, **owner))
+    message_sequence.append(Message(role="user", text=summary_input, **owner))
+    response = create(
+        llm_config=llm_config,
+        user_id=agent_state.user_id,
+        messages=message_sequence,
+        stream=False,
+    )
+    first_choice = response.choices[0]
+    printd(f"summarize_messages gpt reply: {first_choice}")
+    return first_choice.message.content
+class ArchivalMemory(ABC):
+    """Abstract interface for archival memory: insert, search, compile and count"""
+    @abstractmethod
+    def insert(self, memory_string: str):
+        """Store a new entry in archival memory
+        :param memory_string: Text of the memory to store
+        :type memory_string: str
+        """
+    @abstractmethod
+    def search(self, query_string, count=None, start=None) -> Tuple[List[str], int]:
+        """Look up entries in archival memory
+        :param query_string: Text to search for
+        :type query_string: str
+        :param count: Maximum number of results to return (None means all)
+        :type count: Optional[int]
+        :param start: Offset of the first result to return (None means 0)
+        :type start: Optional[int]
+        :return: Tuple of (list of results, total number of results)
+        """
+    @abstractmethod
+    def compile(self) -> str:
+        """Produce the string representation of archival memory used in a prompt"""
+    @abstractmethod
+    def count(self) -> int:
+        """Return how many memories archival memory holds"""
+class RecallMemory(ABC):
+    """Abstract interface for recall memory: text/date search, compile, count and insert"""
+    @abstractmethod
+    def text_search(self, query_string, count=None, start=None):
+        """Find messages in recall memory that match query_string"""
+    @abstractmethod
+    def date_search(self, start_date, end_date, count=None, start=None):
+        """Find messages in recall memory dated between start_date and end_date"""
+    @abstractmethod
+    def compile(self) -> str:
+        """Produce the string representation of recall memory used in a prompt"""
+    @abstractmethod
+    def count(self) -> int:
+        """Return how many memories recall memory holds"""
+    @abstractmethod
+    def insert(self, message: Message):
+        """Add a message to recall memory"""
+class DummyRecallMemory(RecallMemory):
+    """Dummy in-memory version of a recall memory database (eg run on MongoDB)
+    Recall memory here is basically just a full conversation history with the user.
+    Queryable via string matching, or date matching.
+    Recall Memory: The AI's capability to search through past interactions,
+    effectively allowing it to 'remember' prior engagements with a user.
+    """
+    def __init__(self, message_database=None, restrict_search_to_summaries=False):
+        """Wrap an existing list of message records, or start from an empty list
+        :param message_database: List of records; the methods of this class read
+            record["message"]["role"], record["message"]["content"] and record["timestamp"]
+        :param restrict_search_to_summaries: Stored on the instance
+        """
+        self._message_logs = [] if message_database is None else message_database  # consists of full message dicts
+        # If true, the pool of messages that can be queried are the automated summaries only
+        # (generated when the conversation window needs to be shortened)
+        # NOTE(review): the search methods of this class never consult this flag
+        self.restrict_search_to_summaries = restrict_search_to_summaries
+    def __len__(self):
+        return len(self._message_logs)
+    def count(self) -> int:
+        """Return the number of stored message records"""
+        return len(self)
+    def compile(self) -> str:
+        """Return per-role message counts formatted for a prompt (no message content)"""
+        # don't dump all the conversations, just statistics
+        system_count = user_count = assistant_count = function_count = other_count = 0
+        for msg in self._message_logs:
+            role = msg["message"]["role"]
+            if role == "system":
+                system_count += 1
+            elif role == "user":
+                user_count += 1
+            elif role == "assistant":
+                assistant_count += 1
+            elif role == "function":
+                function_count += 1
+            else:
+                other_count += 1
+        memory_str = (
+            f"Statistics:"
+            + f"\n{len(self._message_logs)} total messages"
+            + f"\n{system_count} system"
+            + f"\n{user_count} user"
+            + f"\n{assistant_count} assistant"
+            + f"\n{function_count} function"
+            + f"\n{other_count} other"
+        )
+        return f"\n### RECALL MEMORY ###" + f"\n{memory_str}"
+    def insert(self, message):
+        """Not supported here; always raises NotImplementedError"""
+        raise NotImplementedError("This should be handled by the PersistenceManager, recall memory is just a search layer on top")
+    def _searchable_pool(self):
+        """Return the stored records whose role is neither "system" nor "function" """
+        return [d for d in self._message_logs if d["message"]["role"] not in ["system", "function"]]
+    @staticmethod
+    def _page(matches, count, start):
+        """Slice one page out of matches
+        :param matches: Full list of matching records
+        :param count: Page size, or None for everything from `start` onwards
+        :param start: Offset of the first record, or None for 0
+        :return: Tuple of (records on the page, total number of matches)
+        """
+        start = 0 if start is None else int(start)
+        # count=None must mean "no limit"; coercing it to 0 would always yield an empty page
+        if count is None:
+            return matches[start:], len(matches)
+        return matches[start : start + int(count)], len(matches)
+    def text_search(self, query_string, count=None, start=None):
+        """Case-insensitive substring search over message content
+        :param query_string: Text to look for
+        :param count: Page size, or None for all matches from `start` onwards
+        :param start: Offset of the first match to return, or None for 0
+        :return: Tuple of (matching records on the page, total number of matches)
+        """
+        # in the dummy version, run an (inefficient) case-insensitive match search
+        message_pool = self._searchable_pool()
+        printd(
+            f"recall_memory.text_search: searching for {query_string} (c={count}, s={start}) in {len(self._message_logs)} total messages"
+        )
+        needle = query_string.lower()
+        matches = [d for d in message_pool if d["message"]["content"] is not None and needle in d["message"]["content"].lower()]
+        # start/count support paging through results
+        page, total = self._page(matches, count, start)
+        printd(f"recall_memory - matches:\n{page}")
+        return page, total
+    def date_search(self, start_date, end_date, count=None, start=None):
+        """Search messages whose timestamp date lies between start_date and end_date (inclusive)
+        :param start_date: Lower bound, formatted YYYY-MM-DD
+        :param end_date: Upper bound, formatted YYYY-MM-DD
+        :param count: Page size, or None for all matches from `start` onwards
+        :param start: Offset of the first match to return, or None for 0
+        :return: Tuple of (matching records on the page, total number of matches)
+        :raises ValueError: If either date fails validate_date_format
+        """
+        message_pool = self._searchable_pool()
+        # First, validate the start_date and end_date format
+        if not validate_date_format(start_date) or not validate_date_format(end_date):
+            raise ValueError("Invalid date format. Expected format: YYYY-MM-DD")
+        # Convert dates to datetime objects for comparison
+        start_date_dt = datetime.datetime.strptime(start_date, "%Y-%m-%d")
+        end_date_dt = datetime.datetime.strptime(end_date, "%Y-%m-%d")
+        # Next, match items inside self._message_logs
+        matches = [
+            d
+            for d in message_pool
+            if start_date_dt <= datetime.datetime.strptime(extract_date_from_timestamp(d["timestamp"]), "%Y-%m-%d") <= end_date_dt
+        ]
+        # start/count support paging through results
+        return self._page(matches, count, start)
+class BaseRecallMemory(RecallMemory):
+    """Recall memory based on base functions implemented by storage connectors"""
+    def __init__(self, agent_state, restrict_search_to_summaries=False):
+        """Create the embedding model and the recall storage connector for an agent
+        :param agent_state: Supplies embedding_config, user_id and id
+        :param restrict_search_to_summaries: Stored on the instance
+        """
+        from letta.agent_store.storage import StorageConnector
+        # If true, the pool of messages that can be queried are the automated summaries only
+        # (generated when the conversation window needs to be shortened)
+        self.restrict_search_to_summaries = restrict_search_to_summaries
+        self.agent_state = agent_state
+        # create embedding model
+        embedding_config = agent_state.embedding_config
+        self.embed_model = embedding_model(embedding_config)
+        self.embedding_chunk_size = agent_state.embedding_config.embedding_chunk_size
+        # create storage backend
+        self.storage = StorageConnector.get_recall_storage_connector(user_id=agent_state.user_id, agent_id=agent_state.id)
+        # TODO: have some mechanism for cleanup otherwise will lead to OOM
+        self.cache = {}
+    @staticmethod
+    def _coerce_paging(start, count):
+        """Return (start, count) with None mapped to 0 and other values passed through int()"""
+        # NOTE(review): count=None becomes 0 here; whether the storage connector treats 0 as
+        # "no limit" or "no rows" is not visible from this class -- confirm
+        return (0 if start is None else int(start)), (0 if count is None else int(count))
+    def get_all(self, start=0, count=None):
+        """Fetch messages from storage and return (OpenAI-style dicts, number fetched)"""
+        start, count = self._coerce_paging(start, count)
+        # NOTE(review): arguments are passed positionally as (start, count); verify against the connector signature
+        fetched = self.storage.get_all(start, count)
+        as_dicts = [message.to_openai_dict() for message in fetched]
+        return as_dicts, len(fetched)
+    def text_search(self, query_string, count=None, start=None):
+        """Run a text query against storage and return (search-result dicts, number returned)"""
+        start, count = self._coerce_paging(start, count)
+        fetched = self.storage.query_text(query_string, count, start)
+        as_dicts = [message.to_openai_dict_search_results() for message in fetched]
+        return as_dicts, len(fetched)
+    def date_search(self, start_date, end_date, count=None, start=None):
+        """Run a date-range query against storage and return (search-result dicts, number returned)"""
+        start, count = self._coerce_paging(start, count)
+        fetched = self.storage.query_date(start_date, end_date, count, start)
+        as_dicts = [message.to_openai_dict_search_results() for message in fetched]
+        return as_dicts, len(fetched)
+    def compile(self) -> str:
+        """Return per-role message counts from storage, formatted for a prompt"""
+        total = self.storage.size()
+        # one size query per known role; whatever is left over is reported as "other"
+        per_role = {role: self.storage.size(filters={"role": role}) for role in ("system", "user", "assistant", "function")}
+        other_count = total - sum(per_role.values())
+        stat_lines = [f"Statistics:", f"{total} total messages"]
+        stat_lines.extend(f"{amount} {role}" for role, amount in per_role.items())
+        stat_lines.append(f"{other_count} other")
+        memory_str = "\n".join(stat_lines)
+        return f"\n### RECALL MEMORY ###" + f"\n{memory_str}"
+    def insert(self, message: Message):
+        """Hand a single message to the storage connector"""
+        self.storage.insert(message)
+    def insert_many(self, messages: List[Message]):
+        """Hand a list of messages to the storage connector"""
+        self.storage.insert_many(messages)
+    def save(self):
+        """Ask the storage connector to save"""
+        self.storage.save()
+    def __len__(self):
+        return self.storage.size()
+    def count(self) -> int:
+        """Return the storage size"""
+        return len(self)
+class EmbeddingArchivalMemory(ArchivalMemory):
+    """Archival memory with embedding based search"""
+    def __init__(self, agent_state: AgentState, top_k: int = 100):
+        """Create the embedding model and the archival storage connector for an agent
+        :param agent_state: Supplies embedding_config, user_id and id
+        :type agent_state: AgentState
+        :param top_k: Number of results requested from storage per query; also the default page size of search()
+        :type top_k: int
+        :raises ValueError: If embedding_config.embedding_chunk_size is None
+        """
+        from letta.agent_store.storage import StorageConnector
+        self.top_k = top_k
+        self.agent_state = agent_state
+        # create embedding model
+        self.embed_model = embedding_model(agent_state.embedding_config)
+        if agent_state.embedding_config.embedding_chunk_size is None:
+            # name the missing setting; interpolating its value would only ever print "None"
+            raise ValueError("Must set embedding_config.embedding_chunk_size")
+        self.embedding_chunk_size = agent_state.embedding_config.embedding_chunk_size
+        # create storage backend
+        self.storage = StorageConnector.get_archival_storage_connector(user_id=agent_state.user_id, agent_id=agent_state.id)
+        # TODO: have some mechanism for cleanup otherwise will lead to OOM
+        self.cache = {}
+    def create_passage(self, text, embedding):
+        """Build a Passage owned by this agent from a text chunk and its embedding"""
+        return Passage(
+            user_id=self.agent_state.user_id,
+            agent_id=self.agent_state.id,
+            text=text,
+            embedding=embedding,
+            embedding_config=self.agent_state.embedding_config,
+        )
+    def save(self):
+        """Save the index to disk"""
+        self.storage.save()
+    def insert(self, memory_string, return_ids=False) -> Union[bool, List[str]]:
+        """Embed and save memory string
+        :param memory_string: Text to chunk, embed and store
+        :type memory_string: str
+        :param return_ids: If True, return the ids of the created passages instead of True
+        :type return_ids: bool
+        :return: True, or the list of passage ids (as strings) when return_ids is set
+        :raises TypeError: If memory_string is not a str, or the embedding payload has an unexpected shape
+        """
+        if not isinstance(memory_string, str):
+            raise TypeError("memory must be a string")
+        try:
+            passages = []
+            # breakup string into passages
+            for text in parse_and_chunk_text(memory_string, self.embedding_chunk_size):
+                embedding = self.embed_model.get_text_embedding(text)
+                # fixing weird bug where type returned isn't a list, but instead is an object
+                # eg: embedding={'object': 'list', 'data': [{'object': 'embedding', 'embedding': [-0.0071973633, -0.07893023,
+                if isinstance(embedding, dict):
+                    try:
+                        embedding = embedding["data"][0]["embedding"]
+                    except (KeyError, IndexError):
+                        # TODO as a fallback, see if we can find any lists in the payload
+                        raise TypeError(
+                            f"Got back an unexpected payload from text embedding function, type={type(embedding)}, value={embedding}"
+                        )
+                passages.append(self.create_passage(text, embedding))
+            # grab the return IDs before the list gets modified
+            ids = [str(p.id) for p in passages]
+            # insert passages
+            self.storage.insert_many(passages)
+            return ids if return_ids else True
+        except Exception as e:
+            print("Archival insert error", e)
+            raise  # bare raise keeps the original traceback
+    def search(self, query_string, count=None, start=None):
+        """Search query string
+        :param query_string: Text to search for
+        :type query_string: str
+        :param count: Page size (None means top_k)
+        :type count: Optional[int]
+        :param start: Offset of the first result to return (None means 0)
+        :type start: Optional[int]
+        :return: Tuple of (list of {"timestamp", "content"} dicts for the page, number of cached results for the query)
+        :raises TypeError: If query_string is not a str
+        """
+        start = 0 if start is None else int(start)
+        count = self.top_k if count is None else int(count)
+        if not isinstance(query_string, str):
+            # raise (not return) so callers unpacking the result tuple see the real error
+            raise TypeError("query must be a string")
+        try:
+            if query_string not in self.cache:
+                # results are cached per query string so paging does not re-run the query
+                query_vec = query_embedding(self.embed_model, query_string)
+                self.cache[query_string] = self.storage.query(query_string, query_vec, top_k=self.top_k)
+            cached = self.cache[query_string]
+            end = min(count + start, len(cached))
+            results = [{"timestamp": get_local_time(), "content": node.text} for node in cached[start:end]]
+            # second element is the total for the query, not the page size, so callers can compute page counts
+            return results, len(cached)
+        except Exception as e:
+            print("Archival search error", e)
+            raise  # bare raise keeps the original traceback
+    def compile(self) -> str:
+        """Return the text of up to 10 stored passages plus the storage size, formatted for a prompt"""
+        limit = 10
+        # TODO: only get first 10
+        memory_str = "\n".join(str(passage.text) for passage in self.storage.get_all(limit=limit))
+        return f"\n### ARCHIVAL MEMORY ###" + f"\n{memory_str}" + f"\nSize: {self.storage.size()}"
+    def __len__(self):
+        return self.storage.size()
+    def count(self) -> int:
+        """Return the storage size"""
+        return len(self)