agno 2.0.8__py3-none-any.whl → 2.0.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45)
  1. agno/agent/agent.py +2 -2
  2. agno/db/base.py +14 -0
  3. agno/db/dynamo/dynamo.py +107 -27
  4. agno/db/firestore/firestore.py +109 -33
  5. agno/db/gcs_json/gcs_json_db.py +100 -20
  6. agno/db/in_memory/in_memory_db.py +95 -20
  7. agno/db/json/json_db.py +101 -21
  8. agno/db/migrations/v1_to_v2.py +181 -35
  9. agno/db/mongo/mongo.py +251 -26
  10. agno/db/mysql/mysql.py +307 -6
  11. agno/db/postgres/postgres.py +279 -33
  12. agno/db/redis/redis.py +99 -22
  13. agno/db/singlestore/singlestore.py +319 -38
  14. agno/db/sqlite/sqlite.py +339 -23
  15. agno/models/anthropic/claude.py +0 -20
  16. agno/models/huggingface/huggingface.py +2 -1
  17. agno/models/ollama/chat.py +28 -2
  18. agno/models/openai/chat.py +7 -0
  19. agno/models/openai/responses.py +8 -8
  20. agno/os/interfaces/base.py +2 -0
  21. agno/os/interfaces/slack/router.py +50 -10
  22. agno/os/interfaces/slack/slack.py +6 -4
  23. agno/os/interfaces/whatsapp/router.py +7 -4
  24. agno/os/router.py +18 -0
  25. agno/os/utils.py +2 -2
  26. agno/reasoning/azure_ai_foundry.py +2 -2
  27. agno/reasoning/deepseek.py +2 -2
  28. agno/reasoning/groq.py +2 -2
  29. agno/reasoning/ollama.py +2 -2
  30. agno/reasoning/openai.py +2 -2
  31. agno/run/base.py +15 -2
  32. agno/team/team.py +0 -7
  33. agno/tools/mcp_toolbox.py +284 -0
  34. agno/tools/scrapegraph.py +58 -31
  35. agno/tools/whatsapp.py +1 -1
  36. agno/utils/print_response/agent.py +2 -2
  37. agno/utils/print_response/team.py +6 -6
  38. agno/utils/reasoning.py +22 -1
  39. agno/utils/string.py +9 -0
  40. agno/workflow/workflow.py +0 -1
  41. {agno-2.0.8.dist-info → agno-2.0.9.dist-info}/METADATA +4 -1
  42. {agno-2.0.8.dist-info → agno-2.0.9.dist-info}/RECORD +45 -44
  43. {agno-2.0.8.dist-info → agno-2.0.9.dist-info}/WHEEL +0 -0
  44. {agno-2.0.8.dist-info → agno-2.0.9.dist-info}/licenses/LICENSE +0 -0
  45. {agno-2.0.8.dist-info → agno-2.0.9.dist-info}/top_level.txt +0 -0
agno/db/migrations/v1_to_v2.py
@@ -11,7 +11,7 @@ from agno.db.postgres.postgres import PostgresDb
 from agno.db.schemas.memory import UserMemory
 from agno.db.sqlite.sqlite import SqliteDb
 from agno.session import AgentSession, TeamSession, WorkflowSession
-from agno.utils.log import log_error
+from agno.utils.log import log_error, log_info, log_warning
 
 
 def convert_v1_metrics_to_v2(metrics_dict: Dict[str, Any]) -> Dict[str, Any]:
@@ -127,22 +127,45 @@ def safe_get_runs_from_memory(memory_data: Any) -> Any:
     if memory_data is None:
         return None
 
+    runs: Any = []
+
     # If memory_data is a string, try to parse it as JSON
     if isinstance(memory_data, str):
         try:
             memory_dict = json.loads(memory_data)
             if isinstance(memory_dict, dict):
-                return memory_dict.get("runs")
+                runs = memory_dict.get("runs")
         except (json.JSONDecodeError, AttributeError):
             # If JSON parsing fails, memory_data might just be a string value
             return None
 
     # If memory_data is already a dict, access runs directly
     elif isinstance(memory_data, dict):
-        return memory_data.get("runs")
-
-    # For any other type, return None
-    return None
+        runs = memory_data.get("runs")
+
+    for run in runs or []:
+        # Adjust fields mapping for Agent sessions
+        if run.get("agent_id") is not None:
+            if run.get("team_id") is not None:
+                run.pop("team_id")
+            if run.get("team_session_id") is not None:
+                run["session_id"] = run.pop("team_session_id")
+            if run.get("event"):
+                run["events"] = [run.pop("event")]
+
+        # Adjust fields mapping for Team sessions
+        if run.get("team_id") is not None:
+            if run.get("agent_id") is not None:
+                run.pop("agent_id")
+            if member_responses := run.get("member_responses"):
+                for response in member_responses:
+                    if response.get("agent_id") is not None and response.get("team_id") is not None:
+                        response.pop("team_id")
+                    if response.get("agent_id") is not None and response.get("team_session_id") is not None:
+                        response["session_id"] = response.pop("team_session_id")
+                run["member_responses"] = member_responses
+
+    return runs
 
 
 def convert_v1_media_to_v2(media_data: Dict[str, Any]) -> Dict[str, Any]:
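For context, the reworked safe_get_runs_from_memory no longer returns the raw v1 runs: it also remaps per-run fields into the v2 shape (dropping team_id from agent runs, renaming team_session_id to session_id, wrapping a single event into an events list). A minimal standalone sketch of that remapping with a made-up run payload (the dict below is illustrative and not taken from agno):

# Hypothetical v1 agent run as it might appear inside a session's memory blob
v1_run = {
    "agent_id": "agent_1",
    "team_id": "team_1",                 # dropped for agent runs
    "team_session_id": "session_42",     # renamed to session_id
    "event": {"event": "RunCompleted"},  # wrapped into an events list
}

# The same adjustments the new code applies to runs that carry an agent_id
if v1_run.get("agent_id") is not None:
    if v1_run.get("team_id") is not None:
        v1_run.pop("team_id")
    if v1_run.get("team_session_id") is not None:
        v1_run["session_id"] = v1_run.pop("team_session_id")
    if v1_run.get("event"):
        v1_run["events"] = [v1_run.pop("event")]

print(v1_run)
# {'agent_id': 'agent_1', 'session_id': 'session_42', 'events': [{'event': 'RunCompleted'}]}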
@@ -298,6 +321,7 @@ def migrate(
     team_sessions_table_name: Optional[str] = None,
     workflow_sessions_table_name: Optional[str] = None,
     memories_table_name: Optional[str] = None,
+    batch_size: int = 5000,
 ):
     """Given a database connection and table/collection names, parse and migrate the content to corresponding v2 tables/collections.
 
@@ -308,65 +332,171 @@ def migrate(
         team_sessions_table_name: The name of the team sessions table/collection. If not provided, team sessions will not be migrated.
         workflow_sessions_table_name: The name of the workflow sessions table/collection. If not provided, workflow sessions will not be migrated.
         memories_table_name: The name of the memories table/collection. If not provided, memories will not be migrated.
+        batch_size: Number of records to process in each batch (default: 5000)
     """
     if agent_sessions_table_name:
-        db.migrate_table_from_v1_to_v2(
+        migrate_table_in_batches(
+            db=db,
             v1_db_schema=v1_db_schema,
             v1_table_name=agent_sessions_table_name,
             v1_table_type="agent_sessions",
+            batch_size=batch_size,
         )
 
     if team_sessions_table_name:
-        db.migrate_table_from_v1_to_v2(
+        migrate_table_in_batches(
+            db=db,
             v1_db_schema=v1_db_schema,
             v1_table_name=team_sessions_table_name,
             v1_table_type="team_sessions",
+            batch_size=batch_size,
         )
 
     if workflow_sessions_table_name:
-        db.migrate_table_from_v1_to_v2(
+        migrate_table_in_batches(
+            db=db,
             v1_db_schema=v1_db_schema,
             v1_table_name=workflow_sessions_table_name,
             v1_table_type="workflow_sessions",
+            batch_size=batch_size,
        )
 
     if memories_table_name:
-        db.migrate_table_from_v1_to_v2(
+        migrate_table_in_batches(
+            db=db,
             v1_db_schema=v1_db_schema,
             v1_table_name=memories_table_name,
             v1_table_type="memories",
+            batch_size=batch_size,
         )
 
 
-def get_all_table_content(db, db_schema: str, table_name: str) -> list[dict[str, Any]]:
-    """Get all content from the given table/collection"""
+def migrate_table_in_batches(
+    db: Union[PostgresDb, MySQLDb, SqliteDb, MongoDb],
+    v1_db_schema: str,
+    v1_table_name: str,
+    v1_table_type: str,
+    batch_size: int = 5000,
+):
+    log_info(f"Starting migration of table {v1_table_name} (type: {v1_table_type}) with batch size {batch_size}")
+
+    total_migrated = 0
+    batch_count = 0
+
+    for batch_content in get_table_content_in_batches(db, v1_db_schema, v1_table_name, batch_size):
+        batch_count += 1
+        batch_size_actual = len(batch_content)
+        log_info(f"Processing batch {batch_count} with {batch_size_actual} records from table {v1_table_name}")
+
+        # Parse the content into the new format
+        memories: List[UserMemory] = []
+        sessions: Union[List[AgentSession], List[TeamSession], List[WorkflowSession]] = []
+
+        if v1_table_type == "agent_sessions":
+            sessions = parse_agent_sessions(batch_content)
+        elif v1_table_type == "team_sessions":
+            sessions = parse_team_sessions(batch_content)
+        elif v1_table_type == "workflow_sessions":
+            sessions = parse_workflow_sessions(batch_content)
+        elif v1_table_type == "memories":
+            memories = parse_memories(batch_content)
+        else:
+            raise ValueError(f"Invalid table type: {v1_table_type}")
+
+        # Insert the batch into the new table
+        if v1_table_type in ["agent_sessions", "team_sessions", "workflow_sessions"]:
+            if sessions:
+                # Clear any existing scoped session state for SQL databases to prevent transaction conflicts
+                if hasattr(db, "Session"):
+                    db.Session.remove()  # type: ignore
+
+                db.upsert_sessions(sessions)  # type: ignore
+                total_migrated += len(sessions)
+                log_info(f"Bulk upserted {len(sessions)} sessions in batch {batch_count}")
+
+        elif v1_table_type == "memories":
+            if memories:
+                # Clear any existing scoped session state for SQL databases to prevent transaction conflicts
+                if hasattr(db, "Session"):
+                    db.Session.remove()  # type: ignore
+
+                db.upsert_memories(memories)
+                total_migrated += len(memories)
+                log_info(f"Bulk upserted {len(memories)} memories in batch {batch_count}")
+
+        log_info(f"Completed batch {batch_count}: migrated {batch_size_actual} records")
+
+    log_info(f"✅ Migration completed for table {v1_table_name}: {total_migrated} total records migrated")
+
+
+def get_table_content_in_batches(
+    db: Union[PostgresDb, MySQLDb, SqliteDb, MongoDb], db_schema: str, table_name: str, batch_size: int = 5000
+):
+    """Get table content in batches to avoid memory issues with large tables"""
     try:
-        # Check if this is a MongoDB instance
-        if hasattr(db, "database") and hasattr(db, "db_client"):
-            # MongoDB implementation
+        if isinstance(db, MongoDb):
+            # MongoDB implementation with cursor and batching
             collection = db.database[table_name]
-            # Convert MongoDB documents to dictionaries and handle ObjectId
-            documents = list(collection.find({}))
-            # Convert ObjectId to string for compatibility
-            for doc in documents:
+            cursor = collection.find({}).batch_size(batch_size)
+
+            batch = []
+            for doc in cursor:
+                # Convert ObjectId to string for compatibility
                 if "_id" in doc:
                     doc["_id"] = str(doc["_id"])
-            return documents
-        else:
-            # SQL database implementation (PostgreSQL, MySQL, SQLite)
-            with db.Session() as sess:
-                # Handle empty schema by omitting the schema prefix (needed for SQLite)
-                if db_schema and db_schema.strip():
-                    sql_query = f"SELECT * FROM {db_schema}.{table_name}"
-                else:
-                    sql_query = f"SELECT * FROM {table_name}"
+                batch.append(doc)
+
+                if len(batch) >= batch_size:
+                    yield batch
+                    batch = []
 
-                result = sess.execute(text(sql_query))
-                return [row._asdict() for row in result]
+            # Yield remaining items
+            if batch:
+                yield batch
+        else:
+            # SQL database implementations (PostgresDb, MySQLDb, SqliteDb)
+            offset = 0
+            while True:
+                # Create a new session for each batch to avoid transaction conflicts
+                with db.Session() as sess:
+                    # Handle empty schema by omitting the schema prefix (needed for SQLite)
+                    if db_schema and db_schema.strip():
+                        sql_query = f"SELECT * FROM {db_schema}.{table_name} LIMIT {batch_size} OFFSET {offset}"
+                    else:
+                        sql_query = f"SELECT * FROM {table_name} LIMIT {batch_size} OFFSET {offset}"
+
+                    result = sess.execute(text(sql_query))
+                    batch = [row._asdict() for row in result]
+
+                if not batch:
+                    break
+
+                yield batch
+                offset += batch_size
+
+                # If batch is smaller than batch_size, we've reached the end
+                if len(batch) < batch_size:
+                    break
 
     except Exception as e:
-        log_error(f"Error getting all content from table/collection {table_name}: {e}")
-        return []
+        log_error(f"Error getting batched content from table/collection {table_name}: {e}")
+        return
+
+
+def get_all_table_content(db, db_schema: str, table_name: str) -> list[dict[str, Any]]:
+    """Get all content from the given table/collection (legacy method kept for backward compatibility)
+
+    WARNING: This method loads all data into memory and should not be used for large tables.
+    Use get_table_content_in_batches() for large datasets.
+    """
+    log_warning(
+        f"Loading entire table {table_name} into memory. Consider using get_table_content_in_batches() for large tables, or if you experience any complication."
+    )
+
+    all_content = []
+    for batch in get_table_content_in_batches(db, db_schema, table_name):
+        all_content.extend(batch)
+    return all_content
 
 
 def parse_agent_sessions(v1_content: List[Dict[str, Any]]) -> List[AgentSession]:
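Taken together, the hunk above replaces the per-table db.migrate_table_from_v1_to_v2 calls with batched reads and bulk upserts. A hedged usage sketch follows: only the migrate parameters and the batch_size default come from this diff; the PostgresDb constructor argument, connection string, schema, and table names are assumptions for illustration.

from agno.db.migrations.v1_to_v2 import migrate
from agno.db.postgres.postgres import PostgresDb

# Assumed constructor and connection string; adjust to your environment
db = PostgresDb(db_url="postgresql+psycopg://ai:ai@localhost:5532/ai")

migrate(
    db=db,
    v1_db_schema="ai",                           # schema holding the v1 tables (illustrative)
    agent_sessions_table_name="agent_sessions",  # illustrative v1 table names
    team_sessions_table_name="team_sessions",
    memories_table_name="agent_memories",
    batch_size=5000,  # new in 2.0.9: rows are fetched and upserted in chunks of this size
)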
@@ -385,7 +515,13 @@ def parse_agent_sessions(v1_content: List[Dict[str, Any]]) -> List[AgentSession]:
             "created_at": item.get("created_at"),
             "updated_at": item.get("updated_at"),
         }
-        agent_session = AgentSession.from_dict(session)
+
+        try:
+            agent_session = AgentSession.from_dict(session)
+        except Exception as e:
+            log_error(f"Error parsing agent session: {e}. This is the complete session that failed: {session}")
+            continue
+
         if agent_session is not None:
             sessions_v2.append(agent_session)
 
@@ -408,7 +544,12 @@ def parse_team_sessions(v1_content: List[Dict[str, Any]]) -> List[TeamSession]:
             "created_at": item.get("created_at"),
             "updated_at": item.get("updated_at"),
         }
-        team_session = TeamSession.from_dict(session)
+        try:
+            team_session = TeamSession.from_dict(session)
+        except Exception as e:
+            log_error(f"Error parsing team session: {e}. This is the complete session that failed: {session}")
+            continue
+
         if team_session is not None:
             sessions_v2.append(team_session)
 
@@ -433,7 +574,12 @@ def parse_workflow_sessions(v1_content: List[Dict[str, Any]]) -> List[WorkflowSession]:
             "workflow_name": item.get("workflow_name"),
             "runs": convert_any_metrics_in_data(item.get("runs")),
         }
-        workflow_session = WorkflowSession.from_dict(session)
+        try:
+            workflow_session = WorkflowSession.from_dict(session)
+        except Exception as e:
+            log_error(f"Error parsing workflow session: {e}. This is the complete session that failed: {session}")
+            continue
+
         if workflow_session is not None:
             sessions_v2.append(workflow_session)
 