agmem-0.1.1-py3-none-any.whl → agmem-0.1.2-py3-none-any.whl
This diff compares publicly available package versions as released to a supported public registry. It is provided for informational purposes only and reflects the packages exactly as they appear in that registry.
- {agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/METADATA +20 -3
- agmem-0.1.2.dist-info/RECORD +86 -0
- memvcs/__init__.py +1 -1
- memvcs/cli.py +35 -31
- memvcs/commands/__init__.py +9 -9
- memvcs/commands/add.py +77 -76
- memvcs/commands/blame.py +46 -53
- memvcs/commands/branch.py +13 -33
- memvcs/commands/checkout.py +27 -32
- memvcs/commands/clean.py +18 -23
- memvcs/commands/clone.py +4 -1
- memvcs/commands/commit.py +40 -39
- memvcs/commands/daemon.py +81 -76
- memvcs/commands/decay.py +77 -0
- memvcs/commands/diff.py +56 -57
- memvcs/commands/distill.py +74 -0
- memvcs/commands/fsck.py +55 -61
- memvcs/commands/garden.py +28 -37
- memvcs/commands/graph.py +41 -48
- memvcs/commands/init.py +16 -24
- memvcs/commands/log.py +25 -40
- memvcs/commands/merge.py +16 -28
- memvcs/commands/pack.py +129 -0
- memvcs/commands/pull.py +4 -1
- memvcs/commands/push.py +4 -2
- memvcs/commands/recall.py +145 -0
- memvcs/commands/reflog.py +13 -22
- memvcs/commands/remote.py +1 -0
- memvcs/commands/repair.py +66 -0
- memvcs/commands/reset.py +23 -33
- memvcs/commands/resurrect.py +82 -0
- memvcs/commands/search.py +3 -4
- memvcs/commands/serve.py +2 -1
- memvcs/commands/show.py +66 -36
- memvcs/commands/stash.py +34 -34
- memvcs/commands/status.py +27 -35
- memvcs/commands/tag.py +23 -47
- memvcs/commands/test.py +30 -44
- memvcs/commands/timeline.py +111 -0
- memvcs/commands/tree.py +26 -27
- memvcs/commands/verify.py +59 -0
- memvcs/commands/when.py +115 -0
- memvcs/core/access_index.py +167 -0
- memvcs/core/config_loader.py +3 -1
- memvcs/core/consistency.py +214 -0
- memvcs/core/decay.py +185 -0
- memvcs/core/diff.py +158 -143
- memvcs/core/distiller.py +277 -0
- memvcs/core/gardener.py +164 -132
- memvcs/core/hooks.py +48 -14
- memvcs/core/knowledge_graph.py +134 -138
- memvcs/core/merge.py +248 -171
- memvcs/core/objects.py +95 -96
- memvcs/core/pii_scanner.py +147 -146
- memvcs/core/refs.py +132 -115
- memvcs/core/repository.py +174 -164
- memvcs/core/schema.py +155 -113
- memvcs/core/staging.py +60 -65
- memvcs/core/storage/__init__.py +20 -18
- memvcs/core/storage/base.py +74 -70
- memvcs/core/storage/gcs.py +70 -68
- memvcs/core/storage/local.py +42 -40
- memvcs/core/storage/s3.py +105 -110
- memvcs/core/temporal_index.py +112 -0
- memvcs/core/test_runner.py +101 -93
- memvcs/core/vector_store.py +41 -35
- memvcs/integrations/mcp_server.py +1 -3
- memvcs/integrations/web_ui/server.py +25 -26
- memvcs/retrieval/__init__.py +22 -0
- memvcs/retrieval/base.py +54 -0
- memvcs/retrieval/pack.py +128 -0
- memvcs/retrieval/recaller.py +105 -0
- memvcs/retrieval/strategies.py +314 -0
- memvcs/utils/__init__.py +3 -3
- memvcs/utils/helpers.py +52 -52
- agmem-0.1.1.dist-info/RECORD +0 -67
- {agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/WHEEL +0 -0
- {agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/entry_points.txt +0 -0
- {agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/licenses/LICENSE +0 -0
- {agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/top_level.txt +0 -0
memvcs/core/gardener.py
CHANGED
```diff
@@ -16,6 +16,7 @@ from collections import defaultdict

 try:
     import yaml
+
     YAML_AVAILABLE = True
 except ImportError:
     YAML_AVAILABLE = False
@@ -24,6 +25,7 @@ except ImportError:
 @dataclass
 class EpisodeCluster:
     """A cluster of related episodes."""
+
     topic: str
     episodes: List[Path]
     summary: Optional[str] = None
@@ -33,6 +35,7 @@ class EpisodeCluster:
 @dataclass
 class GardenerConfig:
     """Configuration for the Gardener."""
+
     threshold: int = 50  # Number of episodic files before triggering
     archive_dir: str = "archive"
     min_cluster_size: int = 3
@@ -45,6 +48,7 @@ class GardenerConfig:
 @dataclass
 class GardenerResult:
     """Result of a gardener run."""
+
     success: bool
     clusters_found: int
     insights_generated: int
@@ -56,134 +60,158 @@ class GardenerResult:
 class Gardener:
     """
     The Gardener agent that refines memory over time.
-
+
     Wakes up when episodic/ files exceed a threshold, clusters them by topic,
     generates summaries, and archives the raw episodes.
     """
-
+
     def __init__(self, repo, config: Optional[GardenerConfig] = None):
         """
         Initialize the Gardener.
-
+
         Args:
             repo: Repository instance
             config: Optional configuration
         """
         self.repo = repo
         self.config = config or GardenerConfig()
-        self.episodic_dir = repo.root / 'current' / 'episodic'
-        self.semantic_dir = repo.root / 'current' / 'semantic'
+        self.episodic_dir = repo.root / "current" / "episodic"
+        self.semantic_dir = repo.root / "current" / "semantic"
         # Ensure archive_dir stays under current/ (path safety)
         try:
             archive_candidate = (repo.current_dir / self.config.archive_dir).resolve()
             archive_candidate.relative_to(repo.current_dir.resolve())
             self.archive_dir = archive_candidate
         except (ValueError, RuntimeError):
-            self.archive_dir = repo.current_dir / 'archive'
-
+            self.archive_dir = repo.current_dir / "archive"
+
     def should_run(self) -> bool:
         """Check if the Gardener should run based on threshold."""
         if not self.episodic_dir.exists():
             return False
-
-        episode_count = len(list(self.episodic_dir.glob('**/*.md')))
+
+        episode_count = len(list(self.episodic_dir.glob("**/*.md")))
         return episode_count >= self.config.threshold
-
+
     def get_episode_count(self) -> int:
         """Get the current number of episodic files."""
         if not self.episodic_dir.exists():
             return 0
-        return len(list(self.episodic_dir.glob('**/*.md')))
-
+        return len(list(self.episodic_dir.glob("**/*.md")))
+
     def load_episodes(self) -> List[Tuple[Path, str]]:
         """
         Load all episodic files.
-
+
         Returns:
             List of (path, content) tuples
         """
         episodes = []
-
+
         if not self.episodic_dir.exists():
             return episodes
-
-        for episode_file in self.episodic_dir.glob('**/*.md'):
+
+        for episode_file in self.episodic_dir.glob("**/*.md"):
             try:
                 content = episode_file.read_text()
                 episodes.append((episode_file, content))
             except Exception:
                 continue
-
+
         return episodes
-
+
     def cluster_episodes(self, episodes: List[Tuple[Path, str]]) -> List[EpisodeCluster]:
         """
         Cluster episodes by topic using keyword analysis.
-
+
         For more sophisticated clustering, this could use embeddings with k-means.
-
+
         Args:
             episodes: List of (path, content) tuples
-
+
         Returns:
             List of EpisodeCluster objects
         """
         # Simple keyword-based clustering
         keyword_to_episodes: Dict[str, List[Path]] = defaultdict(list)
-
+
         # Common programming/tech keywords to look for
         keywords = [
-            'python', 'javascript', 'typescript', 'rust', 'go',
-            'error', 'bug', 'fix', 'debug', 'issue', 'api',
-            'database', 'server', 'client', 'frontend', 'backend',
-            'test', 'testing', 'deploy', 'deployment', 'config',
-            'setup', 'install', 'environment', 'performance',
-            'optimization', 'memory', 'cache', 'security', 'auth',
-            'authentication', 'permission', 'user', 'preference',
-            'setting', 'option',
+            "python",
+            "javascript",
+            "typescript",
+            "rust",
+            "go",
+            "error",
+            "bug",
+            "fix",
+            "debug",
+            "issue",
+            "api",
+            "database",
+            "server",
+            "client",
+            "frontend",
+            "backend",
+            "test",
+            "testing",
+            "deploy",
+            "deployment",
+            "config",
+            "setup",
+            "install",
+            "environment",
+            "performance",
+            "optimization",
+            "memory",
+            "cache",
+            "security",
+            "auth",
+            "authentication",
+            "permission",
+            "user",
+            "preference",
+            "setting",
+            "option",
         ]
-
+
         for path, content in episodes:
             content_lower = content.lower()
             found_keywords = []
-
+
             for keyword in keywords:
                 if keyword in content_lower:
                     found_keywords.append(keyword)
                     keyword_to_episodes[keyword].append(path)
-
+
         # Create clusters from keywords with enough episodes
         clusters = []
         used_episodes = set()
-
+
         # Sort by number of episodes (descending)
-        sorted_keywords = sorted(
-            keyword_to_episodes.items(),
-            key=lambda x: len(x[1]),
-            reverse=True
-        )
-
+        sorted_keywords = sorted(keyword_to_episodes.items(), key=lambda x: len(x[1]), reverse=True)
+
         for keyword, episode_paths in sorted_keywords:
             if len(clusters) >= self.config.max_clusters:
                 break
-
+
             # Filter out already-used episodes
             unused_paths = [p for p in episode_paths if p not in used_episodes]
-
+
             if len(unused_paths) >= self.config.min_cluster_size:
-                clusters.append(EpisodeCluster(
-                    topic=keyword,
-                    episodes=unused_paths,
-                    tags=[keyword]
-                ))
+                clusters.append(
+                    EpisodeCluster(topic=keyword, episodes=unused_paths, tags=[keyword])
+                )
                 used_episodes.update(unused_paths)
-
+
         return clusters
-
-    def cluster_episodes_with_embeddings(self, episodes: List[Tuple[Path, str]]) -> List[EpisodeCluster]:
+
+    def cluster_episodes_with_embeddings(
+        self, episodes: List[Tuple[Path, str]]
+    ) -> List[EpisodeCluster]:
         """
         Cluster episodes using embeddings and k-means.
-
+
         Requires scikit-learn and sentence-transformers.
         """
         try:
@@ -192,28 +220,28 @@ class Gardener:
         except ImportError:
             # Fall back to keyword clustering
             return self.cluster_episodes(episodes)
-
+
         if len(episodes) < self.config.min_cluster_size:
             return []
-
+
         # Generate embeddings
-        model = SentenceTransformer('all-MiniLM-L6-v2')
+        model = SentenceTransformer("all-MiniLM-L6-v2")
         texts = [content[:2000] for _, content in episodes]  # Truncate long texts
         embeddings = model.encode(texts)
-
+
         # Determine number of clusters
         n_clusters = min(self.config.max_clusters, len(episodes) // self.config.min_cluster_size)
         n_clusters = max(1, n_clusters)
-
+
         # Cluster
         kmeans = KMeans(n_clusters=n_clusters, random_state=42)
         labels = kmeans.fit_predict(embeddings)
-
+
         # Group episodes by cluster
         cluster_episodes: Dict[int, List[Tuple[Path, str]]] = defaultdict(list)
         for i, (path, content) in enumerate(episodes):
             cluster_episodes[labels[i]].append((path, content))
-
+
         # Create cluster objects
         clusters = []
         for cluster_id, eps in cluster_episodes.items():
@@ -221,31 +249,28 @@ class Gardener:
             # Extract topic from first few words of first episode
             first_content = eps[0][1]
             topic = self._extract_topic(first_content)
-
-            clusters.append(EpisodeCluster(
-                topic=topic,
-                episodes=[p for p, _ in eps]
-            ))
-
+
+            clusters.append(EpisodeCluster(topic=topic, episodes=[p for p, _ in eps]))
+
         return clusters
-
+
     def _extract_topic(self, content: str) -> str:
         """Extract a topic label from content."""
         # Take first line or first 50 chars
-        lines = content.strip().split('\n')
+        lines = content.strip().split("\n")
         first_line = lines[0] if lines else content[:50]
-
+
         # Clean up
-        topic = first_line.strip('#').strip()
+        topic = first_line.strip("#").strip()
         if len(topic) > 50:
-            topic = topic[:47] + '...'
-
+            topic = topic[:47] + "..."
+
         return topic or "general"
-
+
     def generate_summary(self, cluster: EpisodeCluster) -> str:
         """
         Generate a summary for a cluster of episodes.
-
+
         Uses LLM if configured, otherwise generates a simple summary.
         """
         # Collect content from episodes
@@ -256,40 +281,40 @@ class Gardener:
                 contents.append(content[:1000])  # Truncate
             except Exception:
                 continue
-
-        combined = '\n---\n'.join(contents)
-
+
+        combined = "\n---\n".join(contents)
+
         # Try LLM summarization
-        if self.config.llm_provider == 'openai' and self.config.llm_model:
+        if self.config.llm_provider == "openai" and self.config.llm_model:
             try:
                 return self._summarize_with_openai(combined, cluster.topic)
             except Exception:
                 pass
-
+
         # Fall back to simple summary
         return self._simple_summary(cluster, contents)
-
+
     def _summarize_with_openai(self, content: str, topic: str) -> str:
         """Summarize using OpenAI API."""
         import openai
-
+
         response = openai.chat.completions.create(
-            model=self.config.llm_model or 'gpt-3.5-turbo',
+            model=self.config.llm_model or "gpt-3.5-turbo",
             messages=[
                 {
-                    'role': 'system',
-                    'content': 'You are a helpful assistant that summarizes conversation logs into actionable insights.',
+                    "role": "system",
+                    "content": "You are a helpful assistant that summarizes conversation logs into actionable insights.",
                 },
                 {
-                    'role': 'user',
-                    'content': f"Summarize these conversation logs about '{topic}' into 2-3 key insights:\n\n{content[:4000]}",
-                }
+                    "role": "user",
+                    "content": f"Summarize these conversation logs about '{topic}' into 2-3 key insights:\n\n{content[:4000]}",
+                },
             ],
-            max_tokens=500
+            max_tokens=500,
         )
-
+
         return response.choices[0].message.content
-
+
     def _simple_summary(self, cluster: EpisodeCluster, contents: List[str]) -> str:
         """Generate a simple summary without LLM."""
         return f"""# Insights: {cluster.topic.title()}
@@ -305,81 +330,88 @@ class Gardener:
 ---
 *This summary was auto-generated by the Gardener. Review and edit as needed.*
 """
-
+
     def write_insight(self, cluster: EpisodeCluster) -> Path:
         """
         Write cluster summary to semantic memory.
-
+
         Returns:
             Path to the written insight file
         """
         self.semantic_dir.mkdir(parents=True, exist_ok=True)
-
+
         # Generate filename (sanitize topic to avoid path traversal)
-        timestamp = datetime.utcnow().strftime('%Y%m%d')
-        safe_topic = cluster.topic.replace(' ', '-').lower().replace('/', '_').replace('\\', '_')[:30]
+        timestamp = datetime.utcnow().strftime("%Y%m%d")
+        safe_topic = (
+            cluster.topic.replace(" ", "-").lower().replace("/", "_").replace("\\", "_")[:30]
+        )
         filename = f"insight-{safe_topic}-{timestamp}.md"
         insight_path = (self.semantic_dir / filename).resolve()
         try:
             insight_path.relative_to(self.repo.current_dir.resolve())
         except ValueError:
             insight_path = self.semantic_dir / f"insight-{timestamp}.md"
-
+
         # Generate frontmatter
         frontmatter = {
-            'schema_version': '1.0',
-            'last_updated': datetime.utcnow().isoformat() + 'Z',
-            'source_agent_id': 'gardener',
-            'memory_type': 'semantic',
-            'tags': cluster.tags + ['auto-generated', 'insight'],
-            'source_episodes': len(cluster.episodes),
+            "schema_version": "1.0",
+            "last_updated": datetime.utcnow().isoformat() + "Z",
+            "source_agent_id": "gardener",
+            "memory_type": "semantic",
+            "tags": cluster.tags + ["auto-generated", "insight"],
+            "source_episodes": len(cluster.episodes),
         }
-
+
         # Write file
         if YAML_AVAILABLE:
             import yaml
-            content = f"---\n{yaml.dump(frontmatter, default_flow_style=False)}---\n\n{cluster.summary}"
+
+            content = (
+                f"---\n{yaml.dump(frontmatter, default_flow_style=False)}---\n\n{cluster.summary}"
+            )
         else:
             content = cluster.summary
-
+
         insight_path.write_text(content)
         return insight_path
-
+
     def archive_episodes(self, episodes: List[Path]) -> int:
         """
         Archive processed episodes.
-
+
         Moves files to archive directory with timestamp prefix.
-
+
         Returns:
             Number of files archived
         """
         self.archive_dir.mkdir(parents=True, exist_ok=True)
-
-        timestamp = datetime.utcnow().strftime('%Y%m%d-%H%M%S')
+
+        timestamp = datetime.utcnow().strftime("%Y%m%d-%H%M%S")
         archive_subdir = self.archive_dir / timestamp
         archive_subdir.mkdir(exist_ok=True)
-
+
         count = 0
         for episode_path in episodes:
             try:
-                safe_name = episode_path.name.replace('..', '_').replace('/', '_').replace('\\', '_')
+                safe_name = (
+                    episode_path.name.replace("..", "_").replace("/", "_").replace("\\", "_")
+                )
                 dest = (archive_subdir / safe_name).resolve()
                 dest.relative_to(self.archive_dir.resolve())
                 shutil.move(str(episode_path), str(dest))
                 count += 1
             except (ValueError, Exception):
                 continue
-
+
         return count
-
+
     def run(self, force: bool = False) -> GardenerResult:
         """
         Run the Gardener process.
-
+
         Args:
             force: Run even if threshold not met
-
+
         Returns:
             GardenerResult with operation details
         """
@@ -389,9 +421,9 @@ class Gardener:
                 clusters_found=0,
                 insights_generated=0,
                 episodes_archived=0,
-                message=f"Threshold not met ({self.get_episode_count()}/{self.config.threshold} episodes)"
+                message=f"Threshold not met ({self.get_episode_count()}/{self.config.threshold} episodes)",
             )
-
+
         # Load episodes
         episodes = self.load_episodes()
         if not episodes:
@@ -400,67 +432,67 @@ class Gardener:
                 clusters_found=0,
                 insights_generated=0,
                 episodes_archived=0,
-                message="No episodes to process"
+                message="No episodes to process",
             )
-
+
         # Cluster episodes
         try:
             clusters = self.cluster_episodes_with_embeddings(episodes)
         except Exception:
             clusters = self.cluster_episodes(episodes)
-
+
         if not clusters:
             return GardenerResult(
                 success=True,
                 clusters_found=0,
                 insights_generated=0,
                 episodes_archived=0,
-                message="No clusters could be formed"
+                message="No clusters could be formed",
             )
-
+
         # Generate summaries and write insights
         insights_written = 0
         all_archived_episodes = []
-
+
         for cluster in clusters:
             try:
                 # Generate summary
                 cluster.summary = self.generate_summary(cluster)
-
+
                 # Write insight
                 self.write_insight(cluster)
                 insights_written += 1
-
+
                 # Track episodes to archive
                 all_archived_episodes.extend(cluster.episodes)
             except Exception as e:
                 print(f"Warning: Failed to process cluster '{cluster.topic}': {e}")
-
+
         # Archive processed episodes
        archived_count = self.archive_episodes(all_archived_episodes)
-
+
         # Auto-commit if configured
         commit_hash = None
         if self.config.auto_commit and insights_written > 0:
             try:
                 # Stage new insights
-                for insight_file in self.semantic_dir.glob('insight-*.md'):
-                    rel_path = str(insight_file.relative_to(self.repo.root / 'current'))
+                for insight_file in self.semantic_dir.glob("insight-*.md"):
+                    rel_path = str(insight_file.relative_to(self.repo.root / "current"))
                     self.repo.stage_file(f"current/{rel_path}")
-
+
                 # Commit
                 commit_hash = self.repo.commit(
                     f"gardener: synthesized {insights_written} insights from {archived_count} episodes",
-                    {'gardener': True, 'clusters': len(clusters)}
+                    {"gardener": True, "clusters": len(clusters)},
                 )
             except Exception as e:
                 print(f"Warning: Auto-commit failed: {e}")
-
+
         return GardenerResult(
             success=True,
             clusters_found=len(clusters),
             insights_generated=insights_written,
            episodes_archived=archived_count,
            commit_hash=commit_hash,
-            message=f"Processed {len(clusters)} clusters, generated {insights_written} insights"
+            message=f"Processed {len(clusters)} clusters, generated {insights_written} insights",
        )
```