chuk-ai-session-manager 0.7.1__py3-none-any.whl → 0.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (46)
  1. chuk_ai_session_manager/__init__.py +84 -40
  2. chuk_ai_session_manager/api/__init__.py +1 -1
  3. chuk_ai_session_manager/api/simple_api.py +53 -59
  4. chuk_ai_session_manager/exceptions.py +31 -17
  5. chuk_ai_session_manager/guards/__init__.py +118 -0
  6. chuk_ai_session_manager/guards/bindings.py +217 -0
  7. chuk_ai_session_manager/guards/cache.py +163 -0
  8. chuk_ai_session_manager/guards/manager.py +819 -0
  9. chuk_ai_session_manager/guards/models.py +498 -0
  10. chuk_ai_session_manager/guards/ungrounded.py +159 -0
  11. chuk_ai_session_manager/infinite_conversation.py +86 -79
  12. chuk_ai_session_manager/memory/__init__.py +247 -0
  13. chuk_ai_session_manager/memory/artifacts_bridge.py +469 -0
  14. chuk_ai_session_manager/memory/context_packer.py +347 -0
  15. chuk_ai_session_manager/memory/fault_handler.py +507 -0
  16. chuk_ai_session_manager/memory/manifest.py +307 -0
  17. chuk_ai_session_manager/memory/models.py +1084 -0
  18. chuk_ai_session_manager/memory/mutation_log.py +186 -0
  19. chuk_ai_session_manager/memory/pack_cache.py +206 -0
  20. chuk_ai_session_manager/memory/page_table.py +275 -0
  21. chuk_ai_session_manager/memory/prefetcher.py +192 -0
  22. chuk_ai_session_manager/memory/tlb.py +247 -0
  23. chuk_ai_session_manager/memory/vm_prompts.py +238 -0
  24. chuk_ai_session_manager/memory/working_set.py +574 -0
  25. chuk_ai_session_manager/models/__init__.py +21 -9
  26. chuk_ai_session_manager/models/event_source.py +3 -1
  27. chuk_ai_session_manager/models/event_type.py +10 -1
  28. chuk_ai_session_manager/models/session.py +103 -68
  29. chuk_ai_session_manager/models/session_event.py +69 -68
  30. chuk_ai_session_manager/models/session_metadata.py +9 -10
  31. chuk_ai_session_manager/models/session_run.py +21 -22
  32. chuk_ai_session_manager/models/token_usage.py +76 -76
  33. chuk_ai_session_manager/procedural_memory/__init__.py +70 -0
  34. chuk_ai_session_manager/procedural_memory/formatter.py +407 -0
  35. chuk_ai_session_manager/procedural_memory/manager.py +523 -0
  36. chuk_ai_session_manager/procedural_memory/models.py +371 -0
  37. chuk_ai_session_manager/sample_tools.py +79 -46
  38. chuk_ai_session_manager/session_aware_tool_processor.py +27 -16
  39. chuk_ai_session_manager/session_manager.py +238 -197
  40. chuk_ai_session_manager/session_prompt_builder.py +163 -111
  41. chuk_ai_session_manager/session_storage.py +45 -52
  42. {chuk_ai_session_manager-0.7.1.dist-info → chuk_ai_session_manager-0.8.dist-info}/METADATA +79 -3
  43. chuk_ai_session_manager-0.8.dist-info/RECORD +45 -0
  44. {chuk_ai_session_manager-0.7.1.dist-info → chuk_ai_session_manager-0.8.dist-info}/WHEEL +1 -1
  45. chuk_ai_session_manager-0.7.1.dist-info/RECORD +0 -22
  46. {chuk_ai_session_manager-0.7.1.dist-info → chuk_ai_session_manager-0.8.dist-info}/top_level.txt +0 -0
chuk_ai_session_manager/models/token_usage.py
@@ -5,16 +5,16 @@ Token usage tracking models for the chuk session manager.
 This module provides models for tracking token usage in LLM interactions
 with proper async support.
 """
+
 from __future__ import annotations
-from datetime import datetime, timezone
-from typing import Dict, Optional, Union, List, Any
-from uuid import uuid4
+from typing import Dict, Optional, Union, Any
 from pydantic import BaseModel, Field, ConfigDict
 import asyncio
 
 # Try to import tiktoken, but make it optional
 try:
     import tiktoken
+
     TIKTOKEN_AVAILABLE = True
 except ImportError:
     TIKTOKEN_AVAILABLE = False
@@ -23,7 +23,7 @@ except ImportError:
 class TokenUsage(BaseModel):
     """
     Tracks token usage for LLM interactions.
-
+
     Attributes:
         prompt_tokens: Number of tokens in the prompt/input
         completion_tokens: Number of tokens in the completion/output
@@ -31,28 +31,31 @@ class TokenUsage(BaseModel):
         model: The model used for the interaction (helps with pricing calculations)
         estimated_cost_usd: Estimated cost in USD (if pricing info is available)
     """
+
     model_config = ConfigDict(arbitrary_types_allowed=True)
-
+
     prompt_tokens: int = 0
     completion_tokens: int = 0
     total_tokens: int = Field(default=0)
     model: str = ""
     estimated_cost_usd: Optional[float] = None
-
+
     def __init__(self, **data):
         super().__init__(**data)
         # Auto-calculate total tokens if not explicitly provided
-        if self.total_tokens == 0 and (self.prompt_tokens > 0 or self.completion_tokens > 0):
+        if self.total_tokens == 0 and (
+            self.prompt_tokens > 0 or self.completion_tokens > 0
+        ):
             self.total_tokens = self.prompt_tokens + self.completion_tokens
-
+
         # Auto-calculate estimated cost if model is provided
         if self.model and self.estimated_cost_usd is None:
             self.estimated_cost_usd = self._calculate_cost_sync()
-
+
     def _calculate_cost_sync(self) -> float:
         """
         Synchronous implementation of calculate_cost.
-
+
         Returns:
             Estimated cost in USD
         """
@@ -62,40 +65,38 @@ class TokenUsage(BaseModel):
             "gpt-4": {"input": 0.03, "output": 0.06},
             "gpt-4-turbo": {"input": 0.01, "output": 0.03},
             "gpt-3.5-turbo": {"input": 0.0005, "output": 0.0015},
-
             # Claude models
             "claude-3-opus": {"input": 0.015, "output": 0.075},
             "claude-3-sonnet": {"input": 0.003, "output": 0.015},
             "claude-3-haiku": {"input": 0.00025, "output": 0.00125},
-
             # Fallback for unknown models
-            "default": {"input": 0.001, "output": 0.002}
+            "default": {"input": 0.001, "output": 0.002},
         }
-
+
         # Get pricing for this model or use default
         model_pricing = pricing.get(self.model.lower(), pricing["default"])
-
+
         # Calculate cost
         input_cost = (self.prompt_tokens / 1000) * model_pricing["input"]
         output_cost = (self.completion_tokens / 1000) * model_pricing["output"]
-
+
         return round(input_cost + output_cost, 6)
-
+
     async def calculate_cost(self) -> float:
         """
         Async version of calculate_cost.
-
+
         Returns:
             Estimated cost in USD
         """
         # Token calculation is CPU-bound, so run in executor
         loop = asyncio.get_running_loop()
         return await loop.run_in_executor(None, self._calculate_cost_sync)
-
+
     def _update_sync(self, prompt_tokens: int = 0, completion_tokens: int = 0) -> None:
         """
         Synchronous implementation of update.
-
+
         Args:
             prompt_tokens: Additional prompt tokens to add
             completion_tokens: Additional completion tokens to add
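As a sanity check on the hard-coded per-1K-token prices above, here is a small worked example of the arithmetic in _calculate_cost_sync; the token counts are invented for illustration and the prices are the "gpt-4-turbo" row from this diff.

# Illustrative only: 2,000 prompt tokens and 500 completion tokens on "gpt-4-turbo"
prompt_tokens, completion_tokens = 2_000, 500
price = {"input": 0.01, "output": 0.03}  # USD per 1K tokens, as hard-coded above

input_cost = (prompt_tokens / 1000) * price["input"]        # 0.02 USD
output_cost = (completion_tokens / 1000) * price["output"]  # 0.015 USD
print(round(input_cost + output_cost, 6))                   # 0.035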
@@ -103,14 +104,14 @@ class TokenUsage(BaseModel):
         self.prompt_tokens += prompt_tokens
         self.completion_tokens += completion_tokens
         self.total_tokens = self.prompt_tokens + self.completion_tokens
-
+
         if self.model:
             self.estimated_cost_usd = self._calculate_cost_sync()
-
+
     async def update(self, prompt_tokens: int = 0, completion_tokens: int = 0) -> None:
         """
         Async version of update.
-
+
         Args:
             prompt_tokens: Additional prompt tokens to add
             completion_tokens: Additional completion tokens to add
@@ -118,88 +119,85 @@ class TokenUsage(BaseModel):
         self.prompt_tokens += prompt_tokens
         self.completion_tokens += completion_tokens
         self.total_tokens = self.prompt_tokens + self.completion_tokens
-
+
         if self.model:
             self.estimated_cost_usd = await self.calculate_cost()
-
+
     @classmethod
     def _from_text_sync(
-        cls,
-        prompt: str,
-        completion: Optional[str] = None,
-        model: str = "gpt-3.5-turbo"
+        cls, prompt: str, completion: Optional[str] = None, model: str = "gpt-3.5-turbo"
     ) -> TokenUsage:
         """
         Synchronous implementation of from_text.
-
+
         Args:
             prompt: The prompt/input text
             completion: The completion/output text (optional)
             model: The model name to use for counting and pricing
-
+
         Returns:
             A TokenUsage instance with token counts
         """
         prompt_tokens = cls._count_tokens_sync(prompt, model)
-        completion_tokens = cls._count_tokens_sync(completion, model) if completion else 0
-
+        completion_tokens = (
+            cls._count_tokens_sync(completion, model) if completion else 0
+        )
+
         return cls(
             prompt_tokens=prompt_tokens,
             completion_tokens=completion_tokens,
-            model=model
+            model=model,
         )
-
+
     @classmethod
     async def from_text(
-        cls,
-        prompt: str,
-        completion: Optional[str] = None,
-        model: str = "gpt-3.5-turbo"
+        cls, prompt: str, completion: Optional[str] = None, model: str = "gpt-3.5-turbo"
    ) -> TokenUsage:
         """
         Async version of from_text.
-
+
         Args:
             prompt: The prompt/input text
             completion: The completion/output text (optional)
             model: The model name to use for counting and pricing
-
+
         Returns:
             A TokenUsage instance with token counts
         """
         # Run token counting in executor since it's CPU-bound
         loop = asyncio.get_running_loop()
         return await loop.run_in_executor(
-            None,
-            lambda: cls._from_text_sync(prompt, completion, model)
+            None, lambda: cls._from_text_sync(prompt, completion, model)
         )
-
+
     @staticmethod
-    def _count_tokens_sync(text: Optional[Union[str, Any]], model: str = "gpt-3.5-turbo") -> int:
+    def _count_tokens_sync(
+        text: Optional[Union[str, Any]], model: str = "gpt-3.5-turbo"
+    ) -> int:
         """
         Synchronous implementation of count_tokens.
-
+
         Args:
             text: The text to count tokens for
             model: The model name to use for counting
-
+
         Returns:
             The number of tokens
         """
         if text is None:
             return 0
-
+
         # Convert to string if not already a string
         if not isinstance(text, str):
             try:
                 text = str(text)
             except Exception:
                 return 0
-
+
         # Empty string has 0 tokens
         if not text:
             return 0
-
+
         if TIKTOKEN_AVAILABLE:
             try:
                 encoding = tiktoken.encoding_for_model(model)
@@ -212,53 +210,54 @@ class TokenUsage(BaseModel):
             except Exception:
                 # If all else fails, use the approximation
                 pass
-
+
         # Simple approximation: ~4 chars per token for English text
         return int(len(text) / 4)
-
+
     @staticmethod
-    async def count_tokens(text: Optional[Union[str, Any]], model: str = "gpt-3.5-turbo") -> int:
+    async def count_tokens(
+        text: Optional[Union[str, Any]], model: str = "gpt-3.5-turbo"
+    ) -> int:
         """
         Async version of count_tokens.
-
+
         Args:
             text: The text to count tokens for
             model: The model name to use for counting
-
+
         Returns:
             The number of tokens
         """
         # Run in executor since token counting is CPU-bound
         loop = asyncio.get_running_loop()
         return await loop.run_in_executor(
-            None,
-            lambda: TokenUsage._count_tokens_sync(text, model)
+            None, lambda: TokenUsage._count_tokens_sync(text, model)
         )
-
+
     def __add__(self, other: TokenUsage) -> TokenUsage:
         """
         Add two TokenUsage instances together.
-
+
         Args:
             other: Another TokenUsage instance
-
+
         Returns:
             A new TokenUsage instance with combined counts
         """
         # Use the model from self if it exists, otherwise use the other's model
         model = self.model if self.model else other.model
-
+
         return TokenUsage(
             prompt_tokens=self.prompt_tokens + other.prompt_tokens,
             completion_tokens=self.completion_tokens + other.completion_tokens,
-            model=model
+            model=model,
         )
 
 
 class TokenSummary(BaseModel):
     """
     Summarizes token usage across multiple interactions.
-
+
     Attributes:
         total_prompt_tokens: Total tokens used in prompts
         total_completion_tokens: Total tokens used in completions
@@ -266,62 +265,63 @@ class TokenSummary(BaseModel):
         usage_by_model: Breakdown of usage by model
         total_estimated_cost_usd: Total estimated cost across all models
     """
+
     total_prompt_tokens: int = 0
     total_completion_tokens: int = 0
     total_tokens: int = 0
     usage_by_model: Dict[str, TokenUsage] = Field(default_factory=dict)
     total_estimated_cost_usd: float = 0.0
-
+
     def _add_usage_sync(self, usage: TokenUsage) -> None:
         """
         Synchronous implementation of add_usage.
-
+
         Args:
             usage: The TokenUsage to add
         """
         self.total_prompt_tokens += usage.prompt_tokens
         self.total_completion_tokens += usage.completion_tokens
         self.total_tokens += usage.total_tokens
-
+
         if usage.estimated_cost_usd is not None:
             self.total_estimated_cost_usd += usage.estimated_cost_usd
-
+
         if usage.model:
             if usage.model in self.usage_by_model:
                 self.usage_by_model[usage.model]._update_sync(
                     prompt_tokens=usage.prompt_tokens,
-                    completion_tokens=usage.completion_tokens
+                    completion_tokens=usage.completion_tokens,
                 )
             else:
                 self.usage_by_model[usage.model] = TokenUsage(
                     prompt_tokens=usage.prompt_tokens,
                     completion_tokens=usage.completion_tokens,
-                    model=usage.model
+                    model=usage.model,
                 )
-
+
     async def add_usage(self, usage: TokenUsage) -> None:
         """
         Async version of add_usage.
-
+
         Args:
             usage: The TokenUsage to add
         """
         self.total_prompt_tokens += usage.prompt_tokens
         self.total_completion_tokens += usage.completion_tokens
         self.total_tokens += usage.total_tokens
-
+
         if usage.estimated_cost_usd is not None:
             self.total_estimated_cost_usd += usage.estimated_cost_usd
-
+
         if usage.model:
             if usage.model in self.usage_by_model:
                 await self.usage_by_model[usage.model].update(
                     prompt_tokens=usage.prompt_tokens,
-                    completion_tokens=usage.completion_tokens
+                    completion_tokens=usage.completion_tokens,
                 )
             else:
                 self.usage_by_model[usage.model] = TokenUsage(
                     prompt_tokens=usage.prompt_tokens,
                     completion_tokens=usage.completion_tokens,
-                    model=usage.model
-                )
+                    model=usage.model,
+                )
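For orientation, a brief sketch of how the classes touched by the token_usage.py hunks above compose. It assumes TokenUsage and TokenSummary are importable from chuk_ai_session_manager.models.token_usage (as the file list above suggests) and uses made-up text and counts.

import asyncio

from chuk_ai_session_manager.models.token_usage import TokenSummary, TokenUsage


async def main() -> None:
    # Token counting falls back to roughly 4 chars/token when tiktoken is absent
    usage = await TokenUsage.from_text(
        prompt="Summarise the race weekend.",
        completion="Verstappen won by eight seconds.",
        model="gpt-3.5-turbo",
    )

    # __add__ merges counts; the left operand's model wins when it is set
    combined = usage + TokenUsage(prompt_tokens=120, completion_tokens=40, model="gpt-4")

    # TokenSummary keeps running totals plus a per-model breakdown
    summary = TokenSummary()
    await summary.add_usage(combined)
    print(summary.total_tokens, summary.total_estimated_cost_usd)


asyncio.run(main())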
chuk_ai_session_manager/procedural_memory/__init__.py
@@ -0,0 +1,70 @@
+# chuk_ai_session_manager/procedural_memory/__init__.py
+"""
+Procedural Memory System for Tool Usage Learning.
+
+This module provides:
+- Tool invocation tracing (what was called, when, with what args)
+- Outcome tracking (success/failure + error types)
+- Fix detection (linking failures to subsequent successful fixes)
+- Pattern aggregation (learned "recipes" that work)
+- Session persistence (via chuk-ai-session-manager)
+
+Memory Hierarchy:
+- L1: Hot cache (in ConversationProcessor) - not this module
+- L2: ToolLog (session tool traces) - this module
+- L3: ToolPatterns (aggregated knowledge) - this module
+
+Usage:
+    from chuk_ai_session_manager.procedural_memory import (
+        ToolMemoryManager,
+        ToolOutcome,
+    )
+
+    # Create manager (optionally bound to a session)
+    manager = ToolMemoryManager.create(session_id="abc")
+
+    # Record a tool call
+    await manager.record_call(
+        tool_name="solver_solve_plan",
+        arguments={"tasks": 10},
+        result={"status": "sat"},
+        outcome=ToolOutcome.SUCCESS,
+        context_goal="schedule F1 testing"
+    )
+
+    # Get context for paging into model
+    from chuk_ai_session_manager.procedural_memory import ProceduralContextFormatter
+    formatter = ProceduralContextFormatter()
+    context = formatter.format_for_tools(manager, ["solver_solve_plan"])
+"""
+
+from chuk_ai_session_manager.procedural_memory.models import (
+    ToolOutcome,
+    ToolLogEntry,
+    ToolPattern,
+    ToolFixRelation,
+    ProceduralMemory,
+    ErrorPattern,
+    SuccessPattern,
+)
+from chuk_ai_session_manager.procedural_memory.manager import ToolMemoryManager
+from chuk_ai_session_manager.procedural_memory.formatter import (
+    ProceduralContextFormatter,
+    FormatterConfig,
+)
+
+__all__ = [
+    # Models
+    "ToolOutcome",
+    "ToolLogEntry",
+    "ToolPattern",
+    "ToolFixRelation",
+    "ProceduralMemory",
+    "ErrorPattern",
+    "SuccessPattern",
+    # Manager
+    "ToolMemoryManager",
+    # Formatter
+    "ProceduralContextFormatter",
+    "FormatterConfig",
+]
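The Usage block in the new module docstring assumes an already-running event loop. Below is a minimal runnable version built only from the calls that docstring shows; the argument values are the illustrative ones from the docstring, not real data.

import asyncio

from chuk_ai_session_manager.procedural_memory import (
    ProceduralContextFormatter,
    ToolMemoryManager,
    ToolOutcome,
)


async def main() -> None:
    # Bind the manager to a session so tool traces persist (L2 in the hierarchy above)
    manager = ToolMemoryManager.create(session_id="abc")

    # Record one successful tool invocation
    await manager.record_call(
        tool_name="solver_solve_plan",
        arguments={"tasks": 10},
        result={"status": "sat"},
        outcome=ToolOutcome.SUCCESS,
        context_goal="schedule F1 testing",
    )

    # Format the learned context for paging back into the model prompt (L3)
    formatter = ProceduralContextFormatter()
    print(formatter.format_for_tools(manager, ["solver_solve_plan"]))


asyncio.run(main())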