PyPI - agmem - Versions diffs - 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl - Mend

agmem 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (80) hide show

{agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/METADATA +20 -3
agmem-0.1.2.dist-info/RECORD +86 -0
memvcs/__init__.py +1 -1
memvcs/cli.py +35 -31
memvcs/commands/__init__.py +9 -9
memvcs/commands/add.py +77 -76
memvcs/commands/blame.py +46 -53
memvcs/commands/branch.py +13 -33
memvcs/commands/checkout.py +27 -32
memvcs/commands/clean.py +18 -23
memvcs/commands/clone.py +4 -1
memvcs/commands/commit.py +40 -39
memvcs/commands/daemon.py +81 -76
memvcs/commands/decay.py +77 -0
memvcs/commands/diff.py +56 -57
memvcs/commands/distill.py +74 -0
memvcs/commands/fsck.py +55 -61
memvcs/commands/garden.py +28 -37
memvcs/commands/graph.py +41 -48
memvcs/commands/init.py +16 -24
memvcs/commands/log.py +25 -40
memvcs/commands/merge.py +16 -28
memvcs/commands/pack.py +129 -0
memvcs/commands/pull.py +4 -1
memvcs/commands/push.py +4 -2
memvcs/commands/recall.py +145 -0
memvcs/commands/reflog.py +13 -22
memvcs/commands/remote.py +1 -0
memvcs/commands/repair.py +66 -0
memvcs/commands/reset.py +23 -33
memvcs/commands/resurrect.py +82 -0
memvcs/commands/search.py +3 -4
memvcs/commands/serve.py +2 -1
memvcs/commands/show.py +66 -36
memvcs/commands/stash.py +34 -34
memvcs/commands/status.py +27 -35
memvcs/commands/tag.py +23 -47
memvcs/commands/test.py +30 -44
memvcs/commands/timeline.py +111 -0
memvcs/commands/tree.py +26 -27
memvcs/commands/verify.py +59 -0
memvcs/commands/when.py +115 -0
memvcs/core/access_index.py +167 -0
memvcs/core/config_loader.py +3 -1
memvcs/core/consistency.py +214 -0
memvcs/core/decay.py +185 -0
memvcs/core/diff.py +158 -143
memvcs/core/distiller.py +277 -0
memvcs/core/gardener.py +164 -132
memvcs/core/hooks.py +48 -14
memvcs/core/knowledge_graph.py +134 -138
memvcs/core/merge.py +248 -171
memvcs/core/objects.py +95 -96
memvcs/core/pii_scanner.py +147 -146
memvcs/core/refs.py +132 -115
memvcs/core/repository.py +174 -164
memvcs/core/schema.py +155 -113
memvcs/core/staging.py +60 -65
memvcs/core/storage/__init__.py +20 -18
memvcs/core/storage/base.py +74 -70
memvcs/core/storage/gcs.py +70 -68
memvcs/core/storage/local.py +42 -40
memvcs/core/storage/s3.py +105 -110
memvcs/core/temporal_index.py +112 -0
memvcs/core/test_runner.py +101 -93
memvcs/core/vector_store.py +41 -35
memvcs/integrations/mcp_server.py +1 -3
memvcs/integrations/web_ui/server.py +25 -26
memvcs/retrieval/__init__.py +22 -0
memvcs/retrieval/base.py +54 -0
memvcs/retrieval/pack.py +128 -0
memvcs/retrieval/recaller.py +105 -0
memvcs/retrieval/strategies.py +314 -0
memvcs/utils/__init__.py +3 -3
memvcs/utils/helpers.py +52 -52
agmem-0.1.1.dist-info/RECORD +0 -67
{agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/WHEEL +0 -0
{agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/entry_points.txt +0 -0
{agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/licenses/LICENSE +0 -0
{agmem-0.1.1.dist-info → agmem-0.1.2.dist-info}/top_level.txt +0 -0

memvcs/core/pii_scanner.py CHANGED Viewed

@@ -10,12 +10,13 @@ from pathlib import Path
 from typing import List, Dict, Any, Optional
 # IPs to ignore (localhost / internal); not reported as PII
-IP_FALSE_POSITIVES = frozenset(['127.0.0.1', '0.0.0.0', '192.168.0.1', '10.0.0.1'])
+IP_FALSE_POSITIVES = frozenset(["127.0.0.1", "0.0.0.0", "192.168.0.1", "10.0.0.1"])
 @dataclass
 class PIIIssue:
     """A detected PII issue."""
     filepath: str
     line_number: int
     issue_type: str
@@ -27,10 +28,11 @@ class PIIIssue:
 @dataclass
 class PIIScanResult:
     """Result of scanning for PII."""
     has_issues: bool
     issues: List[PIIIssue] = field(default_factory=list)
     scanned_files: int = 0
     def add_issue(self, issue: PIIIssue):
         self.issues.append(issue)
         self.has_issues = True
@@ -39,7 +41,7 @@ class PIIScanResult:
 class PIIScanner:
     """
     Scanner for detecting PII and secrets in memory files.
     Detects:
     - API keys and tokens
     - Credit card numbers
@@ -50,122 +52,119 @@ class PIIScanner:
     - Private keys
     - Database connection strings
     """
     # Patterns for detecting various types of PII and secrets
     PATTERNS = {
-        'api_key': {
-            'pattern': re.compile(
-                r'(?i)'
-                r'(?:api[_-]?key|apikey|api[_-]?secret|api[_-]?token|'
-                r'auth[_-]?token|access[_-]?token|bearer[_-]?token|'
-                r'secret[_-]?key|private[_-]?key|password|passwd|pwd)'
+        "api_key": {
+            "pattern": re.compile(
+                r"(?i)"
+                r"(?:api[_-]?key|apikey|api[_-]?secret|api[_-]?token|"
+                r"auth[_-]?token|access[_-]?token|bearer[_-]?token|"
+                r"secret[_-]?key|private[_-]?key|password|passwd|pwd)"
                 r'\s*[:=]\s*["\']?([a-zA-Z0-9_\-]{16,})["\']?',
-                re.MULTILINE
+                re.MULTILINE,
             ),
-            'description': 'API key or secret token detected',
-            'severity': 'high'
+            "description": "API key or secret token detected",
+            "severity": "high",
         },
-        'aws_key': {
-            'pattern': re.compile(r'(?:AKIA|ABIA|ACCA|ASIA)[A-Z0-9]{16}'),
-            'description': 'AWS access key detected',
-            'severity': 'high'
+        "aws_key": {
+            "pattern": re.compile(r"(?:AKIA|ABIA|ACCA|ASIA)[A-Z0-9]{16}"),
+            "description": "AWS access key detected",
+            "severity": "high",
         },
-        'aws_secret': {
-            'pattern': re.compile(
+        "aws_secret": {
+            "pattern": re.compile(
                 r'(?i)aws[_-]?secret[_-]?(?:access[_-]?)?key\s*[:=]\s*["\']?([a-zA-Z0-9+/]{40})["\']?'
             ),
-            'description': 'AWS secret access key detected',
-            'severity': 'high'
+            "description": "AWS secret access key detected",
+            "severity": "high",
         },
-        'private_key': {
-            'pattern': re.compile(
-                r'-----BEGIN (?:RSA |DSA |EC |OPENSSH )?PRIVATE KEY-----'
-            ),
-            'description': 'Private key detected',
-            'severity': 'high'
+        "private_key": {
+            "pattern": re.compile(r"-----BEGIN (?:RSA |DSA |EC |OPENSSH )?PRIVATE KEY-----"),
+            "description": "Private key detected",
+            "severity": "high",
         },
-        'credit_card': {
-            'pattern': re.compile(
-                r'\b(?:4[0-9]{12}(?:[0-9]{3})?|'  # Visa
-                r'5[1-5][0-9]{14}|'               # Mastercard
-                r'3[47][0-9]{13}|'                # Amex
-                r'6(?:011|5[0-9]{2})[0-9]{12})\b' # Discover
+        "credit_card": {
+            "pattern": re.compile(
+                r"\b(?:4[0-9]{12}(?:[0-9]{3})?|"  # Visa
+                r"5[1-5][0-9]{14}|"  # Mastercard
+                r"3[47][0-9]{13}|"  # Amex
+                r"6(?:011|5[0-9]{2})[0-9]{12})\b"  # Discover
             ),
-            'description': 'Credit card number detected',
-            'severity': 'high'
+            "description": "Credit card number detected",
+            "severity": "high",
         },
-        'ssn': {
-            'pattern': re.compile(r'\b[0-9]{3}-[0-9]{2}-[0-9]{4}\b'),
-            'description': 'Social Security Number detected',
-            'severity': 'high'
+        "ssn": {
+            "pattern": re.compile(r"\b[0-9]{3}-[0-9]{2}-[0-9]{4}\b"),
+            "description": "Social Security Number detected",
+            "severity": "high",
         },
-        'email': {
-            'pattern': re.compile(r'\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b'),
-            'description': 'Email address detected',
-            'severity': 'medium'
+        "email": {
+            "pattern": re.compile(r"\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b"),
+            "description": "Email address detected",
+            "severity": "medium",
         },
-        'phone': {
-            'pattern': re.compile(
-                r'\b(?:\+?1[-.\s]?)?\(?[2-9][0-9]{2}\)?[-.\s]?[2-9][0-9]{2}[-.\s]?[0-9]{4}\b'
+        "phone": {
+            "pattern": re.compile(
+                r"\b(?:\+?1[-.\s]?)?\(?[2-9][0-9]{2}\)?[-.\s]?[2-9][0-9]{2}[-.\s]?[0-9]{4}\b"
             ),
-            'description': 'Phone number detected',
-            'severity': 'medium'
+            "description": "Phone number detected",
+            "severity": "medium",
         },
-        'ip_address': {
-            'pattern': re.compile(
-                r'\b(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}'
-                r'(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\b'
+        "ip_address": {
+            "pattern": re.compile(
+                r"\b(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}"
+                r"(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\b"
             ),
-            'description': 'IP address detected',
-            'severity': 'low'
+            "description": "IP address detected",
+            "severity": "low",
         },
-        'database_url': {
-            'pattern': re.compile(
-                r'(?i)(?:postgres|mysql|mongodb|redis)://[^\s"\'"]+',
-                re.MULTILINE
+        "database_url": {
+            "pattern": re.compile(
+                r'(?i)(?:postgres|mysql|mongodb|redis)://[^\s"\'"]+', re.MULTILINE
             ),
-            'description': 'Database connection string detected',
-            'severity': 'high'
+            "description": "Database connection string detected",
+            "severity": "high",
         },
-        'jwt': {
-            'pattern': re.compile(r'eyJ[A-Za-z0-9_-]+\.eyJ[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+'),
-            'description': 'JWT token detected',
-            'severity': 'high'
+        "jwt": {
+            "pattern": re.compile(r"eyJ[A-Za-z0-9_-]+\.eyJ[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+"),
+            "description": "JWT token detected",
+            "severity": "high",
         },
-        'github_token': {
-            'pattern': re.compile(r'(?:ghp|gho|ghu|ghs|ghr)_[A-Za-z0-9_]{36,}'),
-            'description': 'GitHub token detected',
-            'severity': 'high'
+        "github_token": {
+            "pattern": re.compile(r"(?:ghp|gho|ghu|ghs|ghr)_[A-Za-z0-9_]{36,}"),
+            "description": "GitHub token detected",
+            "severity": "high",
         },
-        'slack_token': {
-            'pattern': re.compile(r'xox[baprs]-[0-9]+-[0-9]+-[a-zA-Z0-9]+'),
-            'description': 'Slack token detected',
-            'severity': 'high'
+        "slack_token": {
+            "pattern": re.compile(r"xox[baprs]-[0-9]+-[0-9]+-[a-zA-Z0-9]+"),
+            "description": "Slack token detected",
+            "severity": "high",
+        },
+        "stripe_key": {
+            "pattern": re.compile(r"(?:sk|pk)_(?:test|live)_[a-zA-Z0-9]{24,}"),
+            "description": "Stripe API key detected",
+            "severity": "high",
         },
-        'stripe_key': {
-            'pattern': re.compile(r'(?:sk|pk)_(?:test|live)_[a-zA-Z0-9]{24,}'),
-            'description': 'Stripe API key detected',
-            'severity': 'high'
-        }
     }
     # Files/patterns to skip
     SKIP_PATTERNS = [
-        r'\.git/',
-        r'\.mem/',
-        r'node_modules/',
-        r'__pycache__/',
-        r'\.pyc$',
-        r'\.pyo$',
+        r"\.git/",
+        r"\.mem/",
+        r"node_modules/",
+        r"__pycache__/",
+        r"\.pyc$",
+        r"\.pyo$",
     ]
     @classmethod
     def _redact(cls, text: str, keep: int = 4) -> str:
         """Partially redact sensitive text for display."""
         if len(text) <= keep * 2:
-            return '*' * len(text)
-        return text[:keep] + '*' * (len(text) - keep * 2) + text[-keep:]
+            return "*" * len(text)
+        return text[:keep] + "*" * (len(text) - keep * 2) + text[-keep:]
     @classmethod
     def _should_skip(cls, filepath: str) -> bool:
         """Check if file should be skipped."""
@@ -173,171 +172,173 @@ class PIIScanner:
             if re.search(pattern, filepath):
                 return True
         return False
     @classmethod
     def scan_content(cls, content: str, filepath: str) -> List[PIIIssue]:
         """
         Scan content for PII.
         Args:
             content: File content to scan
             filepath: Path to the file (for reporting)
         Returns:
             List of PIIIssue objects
         """
         issues = []
-        lines = content.split('\n')
+        lines = content.split("\n")
         for line_num, line in enumerate(lines, 1):
             for pii_type, config in cls.PATTERNS.items():
-                matches = config['pattern'].finditer(line)
+                matches = config["pattern"].finditer(line)
                 for match in matches:
                     matched_text = match.group(0)
                     # Skip common false positives
                     if cls._is_false_positive(pii_type, matched_text, line):
                         continue
-                    issues.append(PIIIssue(
-                        filepath=filepath,
-                        line_number=line_num,
-                        issue_type=pii_type,
-                        description=config['description'],
-                        matched_text=cls._redact(matched_text),
-                        severity=config['severity']
-                    ))
+                    issues.append(
+                        PIIIssue(
+                            filepath=filepath,
+                            line_number=line_num,
+                            issue_type=pii_type,
+                            description=config["description"],
+                            matched_text=cls._redact(matched_text),
+                            severity=config["severity"],
+                        )
+                    )
         return issues
     @classmethod
     def _is_false_positive(cls, pii_type: str, matched_text: str, line: str) -> bool:
         """Check for common false positives."""
         lower_line = line.lower()
         # Skip example/placeholder values
-        if any(x in lower_line for x in ['example', 'placeholder', 'your_', 'xxx', 'sample']):
+        if any(x in lower_line for x in ["example", "placeholder", "your_", "xxx", "sample"]):
             return True
         # Skip comments that are likely documentation
-        if line.strip().startswith('#') and 'example' in lower_line:
+        if line.strip().startswith("#") and "example" in lower_line:
             return True
-        if pii_type == 'ip_address':
+        if pii_type == "ip_address":
             if matched_text in IP_FALSE_POSITIVES:
                 return True
             # Skip version numbers that look like IPs
-            if 'version' in lower_line or 'v.' in lower_line:
+            if "version" in lower_line or "v." in lower_line:
                 return True
         # Email false positives
-        if pii_type == 'email':
+        if pii_type == "email":
             # Skip example domains
-            if any(x in matched_text for x in ['example.com', 'test.com', 'localhost']):
+            if any(x in matched_text for x in ["example.com", "test.com", "localhost"]):
                 return True
         return False
     @classmethod
     def scan_file(cls, filepath: Path) -> List[PIIIssue]:
         """
         Scan a file for PII.
         Args:
             filepath: Path to the file
         Returns:
             List of PIIIssue objects
         """
         if cls._should_skip(str(filepath)):
             return []
         try:
-            content = filepath.read_text(encoding='utf-8', errors='ignore')
+            content = filepath.read_text(encoding="utf-8", errors="ignore")
             return cls.scan_content(content, str(filepath))
         except Exception:
             return []
     @classmethod
     def _get_blob_hash_from_staged(cls, file_info: Any) -> Optional[str]:
         """Get blob hash from StagedFile or dict (staging returns Dict[str, StagedFile])."""
-        if hasattr(file_info, 'blob_hash'):
+        if hasattr(file_info, "blob_hash"):
             return file_info.blob_hash
         if isinstance(file_info, dict):
-            return file_info.get('blob_hash') or file_info.get('hash')
+            return file_info.get("blob_hash") or file_info.get("hash")
         return None
     @classmethod
     def scan_staged_files(cls, repo, staged_files: Dict[str, Any]) -> PIIScanResult:
         """
         Scan staged files for PII.
         Args:
             repo: Repository instance
             staged_files: Dict of staged files with their info
         Returns:
             PIIScanResult with any issues found
         """
         from .objects import Blob
         result = PIIScanResult(has_issues=False)
         for filepath, file_info in staged_files.items():
             if cls._should_skip(filepath):
                 continue
             result.scanned_files += 1
             blob_hash = PIIScanner._get_blob_hash_from_staged(file_info)
             if not blob_hash:
                 continue
             blob = Blob.load(repo.object_store, blob_hash)
             if not blob:
                 continue
             try:
-                content = blob.content.decode('utf-8', errors='ignore')
+                content = blob.content.decode("utf-8", errors="ignore")
             except Exception:
                 continue
             # Scan content
             issues = cls.scan_content(content, filepath)
             for issue in issues:
                 result.add_issue(issue)
         return result
     @classmethod
     def scan_directory(cls, directory: Path, recursive: bool = True) -> PIIScanResult:
         """
         Scan a directory for PII.
         Args:
             directory: Directory to scan
             recursive: Whether to scan recursively
         Returns:
             PIIScanResult with any issues found
         """
         result = PIIScanResult(has_issues=False)
         if recursive:
-            files = directory.rglob('*')
+            files = directory.rglob("*")
         else:
-            files = directory.glob('*')
+            files = directory.glob("*")
         for filepath in files:
             if not filepath.is_file():
                 continue
             if cls._should_skip(str(filepath)):
                 continue
             result.scanned_files += 1
             issues = cls.scan_file(filepath)
             for issue in issues:
                 result.add_issue(issue)
         return result

agmem 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl

agmem 0.1.1__py3-none-any.whl → 0.1.2__py3-none-any.whl