PyPI - tweek - Versions diffs - 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl - Mend

tweek 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61) hide show

tweek/__init__.py +2 -2
tweek/audit.py +2 -2
tweek/cli.py +78 -6605
tweek/cli_config.py +643 -0
tweek/cli_configure.py +413 -0
tweek/cli_core.py +718 -0
tweek/cli_dry_run.py +390 -0
tweek/cli_helpers.py +316 -0
tweek/cli_install.py +1666 -0
tweek/cli_logs.py +301 -0
tweek/cli_mcp.py +148 -0
tweek/cli_memory.py +343 -0
tweek/cli_plugins.py +748 -0
tweek/cli_protect.py +564 -0
tweek/cli_proxy.py +405 -0
tweek/cli_security.py +236 -0
tweek/cli_skills.py +289 -0
tweek/cli_uninstall.py +551 -0
tweek/cli_vault.py +313 -0
tweek/config/allowed_dirs.yaml +16 -17
tweek/config/families.yaml +4 -1
tweek/config/manager.py +17 -0
tweek/config/patterns.yaml +29 -5
tweek/config/templates/config.yaml.template +212 -0
tweek/config/templates/env.template +45 -0
tweek/config/templates/overrides.yaml.template +121 -0
tweek/config/templates/tweek.yaml.template +20 -0
tweek/config/templates.py +136 -0
tweek/config/tiers.yaml +5 -4
tweek/diagnostics.py +112 -32
tweek/hooks/overrides.py +4 -0
tweek/hooks/post_tool_use.py +46 -1
tweek/hooks/pre_tool_use.py +149 -49
tweek/integrations/openclaw.py +84 -0
tweek/licensing.py +1 -1
tweek/mcp/__init__.py +7 -9
tweek/mcp/clients/chatgpt.py +2 -2
tweek/mcp/clients/claude_desktop.py +2 -2
tweek/mcp/clients/gemini.py +2 -2
tweek/mcp/proxy.py +165 -1
tweek/memory/provenance.py +438 -0
tweek/memory/queries.py +2 -0
tweek/memory/safety.py +23 -4
tweek/memory/schemas.py +1 -0
tweek/memory/store.py +101 -71
tweek/plugins/screening/heuristic_scorer.py +1 -1
tweek/security/integrity.py +77 -0
tweek/security/llm_reviewer.py +170 -74
tweek/security/local_reviewer.py +44 -2
tweek/security/model_registry.py +73 -7
tweek/skill_template/overrides-reference.md +1 -1
tweek/skills/context.py +221 -0
tweek/skills/scanner.py +2 -2
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/METADATA +8 -7
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/RECORD +60 -38
tweek/mcp/server.py +0 -320
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/WHEEL +0 -0
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/entry_points.txt +0 -0
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/licenses/LICENSE +0 -0
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/licenses/NOTICE +0 -0
{tweek-0.3.1.dist-info → tweek-0.4.1.dist-info}/top_level.txt +0 -0

tweek/memory/schemas.py CHANGED Viewed

@@ -39,6 +39,7 @@ class ConfidenceAdjustment:
     last_decision: Optional[str]
     adjusted_decision: Optional[str] = None  # suggested decision override
     confidence_score: float = 0.0  # 0.0-1.0 how confident the suggestion is
+    scope: Optional[str] = None  # which scope matched: exact/tool_project/path
 @dataclass

tweek/memory/store.py CHANGED Viewed

@@ -27,6 +27,7 @@ from tweek.memory.safety import (
     MIN_APPROVAL_RATIO,
     MIN_CONFIDENCE_SCORE,
     MIN_DECISION_THRESHOLD,
+    SCOPED_THRESHOLDS,
     compute_suggested_decision,
     is_immune_pattern,
 )
@@ -269,11 +270,19 @@ class MemoryStore:
         current_decision: str = "ask",
         original_severity: str = "medium",
         original_confidence: str = "heuristic",
+        tool_name: Optional[str] = None,
+        project_hash: Optional[str] = None,
     ) -> Optional[ConfidenceAdjustment]:
         """Query memory for a confidence adjustment on a pattern.
-        Returns a ConfidenceAdjustment if memory has enough data,
-        or None if insufficient data / pattern is immune.
+        Uses a narrowest-first scope cascade:
+          1. exact:        pattern + tool + path + project  (threshold: 1)
+          2. tool_project: pattern + tool + project         (threshold: 3)
+          3. path:         pattern + path_prefix            (threshold: 5)
+          4. global:       NEVER — intentionally omitted
+        Returns a ConfidenceAdjustment if memory has enough data at any
+        scope, or None if insufficient data / pattern is immune.
         """
         conn = self._get_connection()
@@ -286,96 +295,117 @@ class MemoryStore:
             )
             return None
-        # Query the confidence view
+        # Build scope cascade: (scope_name, sql_where, params, threshold)
+        scopes = []
+        if tool_name and path_prefix and project_hash:
+            scopes.append((
+                "exact",
+                "pattern_name = ? AND tool_name = ? AND path_prefix = ? AND project_hash = ?",
+                (pattern_name, tool_name, path_prefix, project_hash),
+                SCOPED_THRESHOLDS["exact"],
+            ))
+        if tool_name and project_hash:
+            scopes.append((
+                "tool_project",
+                "pattern_name = ? AND tool_name = ? AND project_hash = ?",
+                (pattern_name, tool_name, project_hash),
+                SCOPED_THRESHOLDS["tool_project"],
+            ))
         if path_prefix:
-            row = conn.execute(
-                """
-                SELECT * FROM pattern_confidence_view
-                WHERE pattern_name = ? AND path_prefix = ?
-                """,
+            scopes.append((
+                "path",
+                "pattern_name = ? AND path_prefix = ?",
                 (pattern_name, path_prefix),
-            ).fetchone()
-        else:
-            row = conn.execute(
-                """
-                SELECT * FROM pattern_confidence_view
-                WHERE pattern_name = ? AND path_prefix IS NULL
-                """,
-                (pattern_name,),
-            ).fetchone()
+                SCOPED_THRESHOLDS["path"],
+            ))
+        # No global fallback — intentionally omitted
-        # Also try without path prefix as fallback
-        if not row and path_prefix:
+        # Try each scope narrowest-first
+        for scope_name, where_clause, params, threshold in scopes:
             row = conn.execute(
-                """
+                f"""
                 SELECT
                     pattern_name,
-                    NULL as path_prefix,
-                    SUM(total_decisions) as total_decisions,
-                    SUM(weighted_approvals) as weighted_approvals,
-                    SUM(weighted_denials) as weighted_denials,
-                    CASE WHEN SUM(weighted_approvals) + SUM(weighted_denials) > 0 THEN
-                        SUM(weighted_approvals) / (SUM(weighted_approvals) + SUM(weighted_denials))
+                    COUNT(*) as total_decisions,
+                    SUM(CASE WHEN user_response = 'approved' THEN decay_weight ELSE 0 END)
+                        as weighted_approvals,
+                    SUM(CASE WHEN user_response = 'denied' THEN decay_weight ELSE 0 END)
+                        as weighted_denials,
+                    CASE WHEN SUM(decay_weight) > 0 THEN
+                        SUM(CASE WHEN user_response = 'approved' THEN decay_weight ELSE 0 END)
+                        / SUM(decay_weight)
                     ELSE 0.5 END as approval_ratio,
-                    MAX(last_decision) as last_decision
-                FROM pattern_confidence_view
-                WHERE pattern_name = ?
+                    MAX(timestamp) as last_decision
+                FROM pattern_decisions
+                WHERE {where_clause} AND decay_weight > 0.01
                 GROUP BY pattern_name
                 """,
-                (pattern_name,),
+                params,
             ).fetchone()
-        if not row:
+            if not row:
+                continue
+            total = row["total_decisions"]
+            weighted_approvals = row["weighted_approvals"] or 0.0
+            weighted_denials = row["weighted_denials"] or 0.0
+            approval_ratio = row["approval_ratio"] or 0.5
+            total_weighted = weighted_approvals + weighted_denials
+            # Check if this scope has enough data
+            if total_weighted < threshold:
+                continue
+            # Compute suggested decision with scope-specific threshold
+            suggested = compute_suggested_decision(
+                current_decision=current_decision,
+                approval_ratio=approval_ratio,
+                total_weighted_decisions=total_weighted,
+                original_severity=original_severity,
+                original_confidence=original_confidence,
+                min_threshold=threshold,
+            )
+            # Confidence score: based on data quantity and consistency
+            confidence_score = 0.0
+            if total_weighted >= threshold:
+                data_factor = min(total_weighted / (threshold * 3), 1.0)
+                ratio_factor = approval_ratio if suggested == "log" else (1 - approval_ratio)
+                confidence_score = data_factor * ratio_factor
+            adjustment = ConfidenceAdjustment(
+                pattern_name=pattern_name,
+                path_prefix=path_prefix,
+                total_decisions=total,
+                weighted_approvals=weighted_approvals,
+                weighted_denials=weighted_denials,
+                approval_ratio=approval_ratio,
+                last_decision=row["last_decision"],
+                adjusted_decision=suggested,
+                confidence_score=confidence_score,
+                scope=scope_name,
+            )
             self._audit(
                 "read", "pattern_decisions",
                 f"{pattern_name}:{path_prefix}",
-                "no_data",
+                f"scope={scope_name}, total={total}, ratio={approval_ratio:.2f}, "
+                f"suggested={suggested}, confidence={confidence_score:.2f}",
             )
-            return None
-        total = row["total_decisions"]
-        weighted_approvals = row["weighted_approvals"] or 0.0
-        weighted_denials = row["weighted_denials"] or 0.0
-        approval_ratio = row["approval_ratio"] or 0.5
-        total_weighted = weighted_approvals + weighted_denials
-        # Compute suggested decision
-        suggested = compute_suggested_decision(
-            current_decision=current_decision,
-            approval_ratio=approval_ratio,
-            total_weighted_decisions=total_weighted,
-            original_severity=original_severity,
-            original_confidence=original_confidence,
-        )
-        # Confidence score: based on data quantity and consistency
-        confidence_score = 0.0
-        if total_weighted >= MIN_DECISION_THRESHOLD:
-            # Scale 0-1 based on how far above threshold and ratio strength
-            data_factor = min(total_weighted / (MIN_DECISION_THRESHOLD * 3), 1.0)
-            ratio_factor = approval_ratio if suggested == "log" else (1 - approval_ratio)
-            confidence_score = data_factor * ratio_factor
-        adjustment = ConfidenceAdjustment(
-            pattern_name=pattern_name,
-            path_prefix=path_prefix,
-            total_decisions=total,
-            weighted_approvals=weighted_approvals,
-            weighted_denials=weighted_denials,
-            approval_ratio=approval_ratio,
-            last_decision=row["last_decision"],
-            adjusted_decision=suggested,
-            confidence_score=confidence_score,
-        )
+            return adjustment
+        # No scope had enough data
         self._audit(
             "read", "pattern_decisions",
             f"{pattern_name}:{path_prefix}",
-            f"total={total}, ratio={approval_ratio:.2f}, suggested={suggested}, "
-            f"confidence={confidence_score:.2f}",
+            "no_data_any_scope",
         )
-        return adjustment
+        return None
     # =====================================================================
     # Source Trust

tweek/plugins/screening/heuristic_scorer.py CHANGED Viewed

@@ -3,7 +3,7 @@ Tweek Heuristic Scorer Screening Plugin
 Lightweight signal-based scoring for confidence-gated LLM escalation.
 Runs between Layer 2 (regex) and Layer 3 (LLM) to detect novel attack
-variants that don't match any of the 259 regex patterns but exhibit
+variants that don't match any of the 262 regex patterns but exhibit
 suspicious characteristics.
 Scoring signals (all local, no network, no LLM):

tweek/security/integrity.py ADDED Viewed

@@ -0,0 +1,77 @@
+#!/usr/bin/env python3
+"""
+Tweek Source File Integrity — Self-Trust for Own Package Files
+Prevents false-positive security warnings when Tweek's hooks screen
+Tweek's own source code (which naturally contains patterns like
+"prompt injection", ".env", "bypass hooks", etc.).
+Security model:
+    - Package-relative: only files physically inside the installed
+      tweek Python package are trusted.
+    - Resolved paths: symlinks and ".." traversal are resolved before
+      comparison, so an attacker cannot trick the check with crafted paths.
+    - Read-only trust: this only skips *screening* of file content that
+      Claude reads.  It does NOT allow execution, writing, or any other
+      privileged action.
+What IS trusted:
+    - Python source (.py), YAML configs (.yaml/.yml), Markdown (.md),
+      plain-text (.txt), and JSON (.json) files shipped inside the tweek
+      package directory.
+What is NOT trusted:
+    - User config files (~/.tweek/*)
+    - Downloaded model files (~/.tweek/models/*)
+    - Any file outside the package directory, even if named similarly
+    - Non-allowlisted file extensions (e.g., .onnx, .bin, .pkl)
+"""
+from pathlib import Path
+# Resolve the tweek package root at import time.
+# This file lives at tweek/security/integrity.py, so .parent.parent = tweek/
+_TWEEK_PACKAGE_ROOT: Path = Path(__file__).resolve().parent.parent
+# Only trust files with these extensions — never trust binary/model files
+_TRUSTED_EXTENSIONS: frozenset = frozenset({
+    ".py", ".yaml", ".yml", ".md", ".txt", ".json",
+})
+def is_trusted_tweek_file(file_path: str) -> bool:
+    """Check whether a file is a verified Tweek package source file.
+    A file is trusted if and only if:
+    1. Its fully-resolved path is inside the tweek package directory.
+    2. It has an allowlisted extension (source/config only, no binaries).
+    3. The file actually exists on disk (prevents speculative path trust).
+    The check fails closed: an empty path, or an OSError, ValueError or
+    TypeError raised while resolving or inspecting the path, yields False.
+    Args:
+        file_path: Absolute or relative path to check.
+    Returns:
+        True if the file is a Tweek source file that should skip screening,
+        False otherwise (including on any of the handled errors above).
+    """
+    # Falsy input (empty string, None) can never name a trusted file
+    if not file_path:
+        return False
+    try:
+        # resolve() follows symlinks and collapses ".." before any comparison
+        resolved = Path(file_path).resolve()
+        # Must exist — don't trust hypothetical paths
+        if not resolved.is_file():
+            return False
+        # Must have a safe extension (suffix is lower-cased before the lookup)
+        if resolved.suffix.lower() not in _TRUSTED_EXTENSIONS:
+            return False
+        # Must be inside the tweek package directory
+        # Uses is_relative_to (Python 3.9+) for safe containment check
+        # NOTE(review): on Python < 3.9 this call would raise AttributeError,
+        # which the except clause below does not catch — confirm the
+        # package's minimum supported Python version.
+        if not resolved.is_relative_to(_TWEEK_PACKAGE_ROOT):
+            return False
+        return True
+    except (OSError, ValueError, TypeError):
+        # Treat any path-handling failure as "not trusted"
+        return False

tweek 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl

tweek 0.3.1__py3-none-any.whl → 0.4.1__py3-none-any.whl