PyPI - vigil-codeintel - Versions diffs - 0.1.0__py3-none-any.whl - Mend

vigil-codeintel 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (131) hide show

vigil_codeintel-0.1.0.dist-info/METADATA +780 -0
vigil_codeintel-0.1.0.dist-info/RECORD +131 -0
vigil_codeintel-0.1.0.dist-info/WHEEL +5 -0
vigil_codeintel-0.1.0.dist-info/entry_points.txt +3 -0
vigil_codeintel-0.1.0.dist-info/licenses/LICENSE +21 -0
vigil_codeintel-0.1.0.dist-info/top_level.txt +3 -0
vigil_forensic/__init__.py +224 -0
vigil_forensic/_git_utils.py +178 -0
vigil_forensic/_shared.py +510 -0
vigil_forensic/_stubs.py +156 -0
vigil_forensic/gate_checks/__init__.py +1 -0
vigil_forensic/gate_checks/_ast_helpers.py +629 -0
vigil_forensic/gate_checks/_deployment_detector.py +573 -0
vigil_forensic/gate_checks/atomic_write_checks.py +1143 -0
vigil_forensic/gate_checks/authority_checks.py +95 -0
vigil_forensic/gate_checks/boundary_breach_checks.py +202 -0
vigil_forensic/gate_checks/broad_except_checks.py +301 -0
vigil_forensic/gate_checks/broad_except_hidden_sentinel_checks.py +365 -0
vigil_forensic/gate_checks/common.py +253 -0
vigil_forensic/gate_checks/config_safety_checks.py +704 -0
vigil_forensic/gate_checks/config_ssot_checks.py +78 -0
vigil_forensic/gate_checks/conflict_checks.py +193 -0
vigil_forensic/gate_checks/context_fallback_checks.py +697 -0
vigil_forensic/gate_checks/context_health_checks.py +289 -0
vigil_forensic/gate_checks/contract_shape_drift_checks.py +459 -0
vigil_forensic/gate_checks/dirty_baseline_check.py +274 -0
vigil_forensic/gate_checks/duplication_checks.py +387 -0
vigil_forensic/gate_checks/embedded_string_checks.py +123 -0
vigil_forensic/gate_checks/empty_output_checks.py +87 -0
vigil_forensic/gate_checks/encoding_checks.py +847 -0
vigil_forensic/gate_checks/export_completeness_checks.py +156 -0
vigil_forensic/gate_checks/fallback_checks.py +41 -0
vigil_forensic/gate_checks/file_proliferation_checks.py +171 -0
vigil_forensic/gate_checks/fix_without_test_checks.py +69 -0
vigil_forensic/gate_checks/forensic_cluster_runners/__init__.py +9 -0
vigil_forensic/gate_checks/forensic_cluster_runners/_helpers.py +71 -0
vigil_forensic/gate_checks/forensic_cluster_runners/advanced_checks.py +322 -0
vigil_forensic/gate_checks/forensic_cluster_runners/core.py +273 -0
vigil_forensic/gate_checks/forensic_cluster_runners/integrity_checks.py +203 -0
vigil_forensic/gate_checks/forensic_cluster_runners/quality_checks.py +666 -0
vigil_forensic/gate_checks/forensic_clusters/__init__.py +193 -0
vigil_forensic/gate_checks/forensic_clusters/allowlist.py +426 -0
vigil_forensic/gate_checks/forensic_clusters/allowlist_writer.py +302 -0
vigil_forensic/gate_checks/forensic_clusters/api_protocol.py +231 -0
vigil_forensic/gate_checks/forensic_clusters/async_quality.py +1156 -0
vigil_forensic/gate_checks/forensic_clusters/code_style.py +808 -0
vigil_forensic/gate_checks/forensic_clusters/core.py +319 -0
vigil_forensic/gate_checks/forensic_clusters/data_quality.py +763 -0
vigil_forensic/gate_checks/forensic_clusters/dead_code.py +480 -0
vigil_forensic/gate_checks/forensic_clusters/edit_mutation.py +842 -0
vigil_forensic/gate_checks/forensic_clusters/exception_boundary.py +240 -0
vigil_forensic/gate_checks/forensic_clusters/legacy_debt.py +556 -0
vigil_forensic/gate_checks/forensic_clusters/static_analysis.py +834 -0
vigil_forensic/gate_checks/forensic_clusters/structural_quality.py +298 -0
vigil_forensic/gate_checks/god_object_zones_checks.py +173 -0
vigil_forensic/gate_checks/hallucination_checks.py +566 -0
vigil_forensic/gate_checks/hunter_artifact_completeness_check.py +139 -0
vigil_forensic/gate_checks/implementation_overfit_checks.py +380 -0
vigil_forensic/gate_checks/import_integrity_checks.py +233 -0
vigil_forensic/gate_checks/imports_in_function_checks.py +283 -0
vigil_forensic/gate_checks/ml_checks.py +318 -0
vigil_forensic/gate_checks/performance_checks.py +106 -0
vigil_forensic/gate_checks/project_specific_runner.py +691 -0
vigil_forensic/gate_checks/provider_capability_checks.py +73 -0
vigil_forensic/gate_checks/refactor_completeness_checks.py +274 -0
vigil_forensic/gate_checks/reliability_checks.py +389 -0
vigil_forensic/gate_checks/reporting_checks.py +55 -0
vigil_forensic/gate_checks/runtime_behavior_checks.py +220 -0
vigil_forensic/gate_checks/security_injection_checks.py +332 -0
vigil_forensic/gate_checks/semantic_intent_checks.py +139 -0
vigil_forensic/gate_checks/size_complexity_checks.py +336 -0
vigil_forensic/gate_checks/stuck_feature_flag_checks.py +354 -0
vigil_forensic/gate_checks/syntax_validity_checks.py +217 -0
vigil_forensic/gate_checks/temporal_freshness_checks.py +79 -0
vigil_forensic/gate_checks/test_quality_checks.py +946 -0
vigil_forensic/gate_checks/testing_checks.py +149 -0
vigil_forensic/gate_checks/toctou_checks.py +367 -0
vigil_forensic/gate_checks/type_checking_checks.py +316 -0
vigil_forensic/gate_models.py +392 -0
vigil_forensic/gate_packs/__init__.py +1 -0
vigil_forensic/gate_packs/universal.py +179 -0
vigil_forensic/gate_profile.json +31 -0
vigil_forensic/gate_registry.py +21 -0
vigil_forensic/language_profiles.py +219 -0
vigil_forensic/meta_findings.py +207 -0
vigil_forensic/self_audit.py +725 -0
vigil_forensic/source_analysis.py +175 -0
vigil_mapper/__init__.py +103 -0
vigil_mapper/_ast_helpers_minimal.py +229 -0
vigil_mapper/_extract_imports_impl.py +123 -0
vigil_mapper/_file_count_guard.py +129 -0
vigil_mapper/_git_utils.py +178 -0
vigil_mapper/_runtime_ast.py +438 -0
vigil_mapper/_runtime_dispatch.py +137 -0
vigil_mapper/_seed_helpers.py +82 -0
vigil_mapper/authority_builder.py +1102 -0
vigil_mapper/cli_entry.py +731 -0
vigil_mapper/conflict_builder.py +818 -0
vigil_mapper/data_contract_builder.py +446 -0
vigil_mapper/findings_builder.py +716 -0
vigil_mapper/fingerprint.py +53 -0
vigil_mapper/hotspot_builder.py +539 -0
vigil_mapper/map_common.py +449 -0
vigil_mapper/map_errors.py +55 -0
vigil_mapper/map_models.py +431 -0
vigil_mapper/map_models_ext.py +206 -0
vigil_mapper/map_models_findings.py +130 -0
vigil_mapper/map_storage.py +455 -0
vigil_mapper/parse_cache.py +795 -0
vigil_mapper/refactor_boundary_builder.py +266 -0
vigil_mapper/runtime_builder.py +527 -0
vigil_mapper/runtime_tracer.py +243 -0
vigil_mapper/runtime_tracer_entry.py +199 -0
vigil_mapper/semantic_diff.py +71 -0
vigil_mapper/source_adapters/__init__.py +109 -0
vigil_mapper/source_adapters/_base.py +264 -0
vigil_mapper/source_adapters/_ir.py +156 -0
vigil_mapper/source_adapters/_lexer.py +309 -0
vigil_mapper/source_adapters/_patterns.py +212 -0
vigil_mapper/source_adapters/_treesitter.py +182 -0
vigil_mapper/source_adapters/go.py +553 -0
vigil_mapper/source_adapters/java.py +541 -0
vigil_mapper/source_adapters/javascript.py +626 -0
vigil_mapper/source_adapters/python.py +325 -0
vigil_mapper/source_adapters/typescript.py +749 -0
vigil_mapper/structural_builder.py +586 -0
vigil_mcp/__init__.py +1 -0
vigil_mcp/_jobs.py +587 -0
vigil_mcp/_paths.py +93 -0
vigil_mcp/forensic_server.py +419 -0
vigil_mcp/map_server.py +452 -0

vigil_forensic/gate_checks/provider_capability_checks.py ADDED Viewed

@@ -0,0 +1,73 @@
+"""Provider capability gate check.
+Detects executor provider capability mismatches before gate-monitored runs.
+Registered in gate_registry.py before tool_hook_coverage_checks.
+"""
+from __future__ import annotations
+from vigil_forensic._shared import GateCategory, GateCheckResult, GateImpact, GateSeverity
+from vigil_forensic.gate_models import PostExecGateContext
+from .common import build_check_result, build_finding
+import logging
+# Module-level logger named after this module's import path.
+_log = logging.getLogger(__name__)
+# Public API: only the gate entry point is exported on star-import.
+__all__ = ["check_provider_capabilities"]
+def check_provider_capabilities(ctx: PostExecGateContext) -> GateCheckResult:
+    """Check executor provider capabilities against gate requirements.
+    - PC01: Gemini executor uses trace-file hooks (not stream) -- WARN so that
+      tool_hook_coverage gate does not BLOCK on zero hook-event count.
+    - PC02: executor_provider missing from metadata -- soft WARN.
+    """
+    findings = []
+    executor_provider = str(
+        ctx.control_task_metadata.get("executor_provider") or ""
+    ).strip()
+    if executor_provider == "gemini":
+        findings.append(
+            build_finding(
+                check_id="PC01_gemini_hook_events_in_trace",
+                category=GateCategory.CONTRACT,
+                title="Gemini executor: hook events go to trace file, not JSON stream",
+                severity=GateSeverity.LOW,
+                impact=GateImpact.REVISE,
+                summary=(
+                    "Gemini executor writes hook events to the trace file, not the "
+                    "JSON stream. tool_hook_coverage gate counts will be 0 -- expected."
+                ),
+                recommendation="No action needed. tool_hook_coverage gate should not BLOCK on Gemini runs.",
+                repair_kind='refactor',
+                executor_action='Address finding details',
+                proof_required='Issue fixed',
+                allowlist_allowed=False,
+            )
+        )
+    if not executor_provider:
+        findings.append(
+            build_finding(
+                check_id="PC02_executor_provider_unknown",
+                category=GateCategory.CONTRACT,
+                title="executor_provider metadata missing -- cannot validate capabilities",
+                severity=GateSeverity.LOW,
+                impact=GateImpact.REVISE,
+                summary="executor_provider key absent from control task metadata.",
+                recommendation="Ensure pocketcoder_executor.py writes executor_provider to control task metadata.",
+                repair_kind='refactor',
+                executor_action='Address finding details',
+                proof_required='Issue fixed',
+                allowlist_allowed=False,
+            )
+        )
+    return build_check_result(
+        check_id="provider_capability",
+        category=GateCategory.CONTRACT,
+        findings=findings,
+    )

vigil_forensic/gate_checks/refactor_completeness_checks.py ADDED Viewed

@@ -0,0 +1,274 @@
+"""Refactor completeness forensic gate.
+refactor.partial_rename: detect AI artifact where a symbol was renamed in some
+files but the old name persists in others — i.e. an incomplete rename.
+Detection approach (v1 — static, no git history required):
+  1. Walk all touched .py files, extract public function/class names via AST.
+  2. For every pair of names across different files, compute Levenshtein distance.
+  3. If distance <= 2 and the names are not identical, emit a
+     refactor.partial_rename_candidate finding (MEDIUM / WARN).
+Fails open: AST/IO errors -> skip file, never crash.
+Allowlist supported: similar names can be legitimate (overloads, aliases).
+"""
+from __future__ import annotations
+import ast
+import logging
+from vigil_forensic._shared import (
+    EvidenceReference,
+    GateCategory,
+    GateImpact,
+    GateSeverity,
+    RepairKind,
+)
+from vigil_forensic.gate_models import PostExecGateContext
+from ..source_analysis import is_source_file
+from .common import build_check_result, build_finding, normalize_path
+from ._ast_helpers import parse_python_source_or_emit_finding
+import re
+# Module-level logger named after this module's import path.
+_log = logging.getLogger(__name__)
+# ---------------------------------------------------------------------------
+# FP-mitigation constants
+# ---------------------------------------------------------------------------
+# Minimum length a name must have to be compared; shorter names are too
+# generic to flag as partial renames.
+_MIN_NAME_LENGTH = 6
+# Ceiling on edit_distance / max(len_a, len_b). Despite the identifier this is
+# a normalised *distance*: a pair whose ratio exceeds it is treated as not
+# similar enough to warrant a finding.
+_MAX_SIMILARITY_RATIO = 0.3
+# O(n²) guard: if total public names across all touched files exceeds this,
+# only the first _MAX_TOTAL_NAMES names (in file iteration order) are compared
+# and a debug message is logged.
+_MAX_TOTAL_NAMES = 200
+# Hard cap on the size of the findings list: once it holds this many entries,
+# no further partial-rename findings are added in that run.
+_MAX_FINDINGS = 20
+# Matches a trailing version suffix such as the "_v1" in MyClass_v1, so that
+# intentionally versioned names (MyClass_v1 / MyClass_v2) can be recognised.
+_VERSION_SUFFIX_RE = re.compile(r"_v\d+$")
+# ---------------------------------------------------------------------------
+# Levenshtein distance (stdlib-only, no external deps)
+# ---------------------------------------------------------------------------
+def _levenshtein(a: str, b: str) -> int:
+    """Return the Levenshtein edit distance between *a* and *b*."""
+    if a == b:
+        return 0
+    m, n = len(a), len(b)
+    if m < n:
+        a, b, m, n = b, a, n, m
+    # Single-row DP.
+    prev = list(range(n + 1))
+    for i in range(1, m + 1):
+        curr = [i] + [0] * n
+        for j in range(1, n + 1):
+            cost = 0 if a[i - 1] == b[j - 1] else 1
+            curr[j] = min(
+                prev[j] + 1,       # deletion
+                curr[j - 1] + 1,   # insertion
+                prev[j - 1] + cost,  # substitution
+            )
+        prev = curr
+    return prev[n]
+# ---------------------------------------------------------------------------
+# AST helper: extract public top-level names
+# ---------------------------------------------------------------------------
+def _extract_public_names(
+    content: str,
+    *,
+    rel_path: str = "",
+    emit_finding=None,
+) -> list[str]:
+    """Return public (non-dunder, non-private) function and class names at
+    module or class level from *content*.
+    B4 (2026-04-23): on SyntaxError, emit ``meta.syntax_parse_error`` via the
+    shared helper (if ``emit_finding`` supplied) instead of silently returning
+    ``[]``.
+    """
+    tree = parse_python_source_or_emit_finding(
+        content,
+        rel_path=rel_path,
+        emit_finding=emit_finding,
+        emitting_gate="refactor_completeness",
+    )
+    if tree is None:
+        return []
+    names: list[str] = []
+    for node in ast.walk(tree):
+        if isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef, ast.ClassDef)):
+            name: str = node.name
+            if not name.startswith("_"):
+                names.append(name)
+    return names
+# ---------------------------------------------------------------------------
+# Main gate runner
+# ---------------------------------------------------------------------------
+def run_refactor_completeness_checks(ctx: PostExecGateContext):
+    """Detect partial renames across touched .py files.
+    For each pair of public names (name_a from file_a, name_b from file_b):
+      - Skip identical names.
+      - If Levenshtein(name_a, name_b) <= 2: emit MEDIUM / WARN finding.
+    The check operates on ctx.touched_files (not ctx.changed_files_observed)
+    so it works even without git diff context.
+    """
+    findings = []
+    # Build map: normalized_path -> list[public_name]
+    file_names: dict[str, list[str]] = {}
+    for raw_path in ctx.touched_files:
+        normalized = normalize_path(raw_path)
+        if not is_source_file(normalized):
+            continue
+        abs_path = ctx.project_dir / normalized
+        try:
+            content = abs_path.read_text(encoding="utf-8")
+        except (OSError, UnicodeDecodeError) as exc:
+            _log.debug("refactor_completeness: cannot read %s: %s", normalized, exc)
+            continue
+        public_names = _extract_public_names(
+            content,
+            rel_path=normalized,
+            emit_finding=findings.append,
+        )
+        if public_names:
+            file_names[normalized] = public_names
+    # O(n²) guard: cap total public names to avoid quadratic blowup.
+    total_names = sum(len(v) for v in file_names.values())
+    _partial_scan = total_names > _MAX_TOTAL_NAMES
+    if _partial_scan:
+        _log.debug(
+            "refactor_completeness: total public names %d > %d cap; "
+            "partial scan — tune threshold if needed",
+            total_names,
+            _MAX_TOTAL_NAMES,
+        )
+        # Truncate each file's name list proportionally by capping the flat list.
+        truncated: dict[str, list[str]] = {}
+        remaining = _MAX_TOTAL_NAMES
+        for p, names in file_names.items():
+            take = min(len(names), remaining)
+            if take <= 0:
+                break
+            truncated[p] = names[:take]
+            remaining -= take
+        file_names = truncated
+    # Deduplicate pairs: only emit once per (name_a, name_b) pair regardless
+    # of how many files contain either name.
+    seen_pairs: set[frozenset[str]] = set()
+    paths = list(file_names.keys())
+    for i, path_a in enumerate(paths):
+        for path_b in paths[i + 1:]:
+            for name_a in file_names[path_a]:
+                for name_b in file_names[path_b]:
+                    if name_a == name_b:
+                        continue
+                    # FP filter 1: names too short to be meaningful.
+                    if len(name_a) < _MIN_NAME_LENGTH or len(name_b) < _MIN_NAME_LENGTH:
+                        continue
+                    # FP filter 2: plural-singular pairs (name_b == name_a + "s" or vice versa).
+                    if name_b == name_a + "s" or name_a == name_b + "s":
+                        continue
+                    # FP filter 3: intentional versioning suffix (X_v1 vs X_v2).
+                    base_a = _VERSION_SUFFIX_RE.sub("", name_a)
+                    base_b = _VERSION_SUFFIX_RE.sub("", name_b)
+                    if base_a == base_b:
+                        continue
+                    pair_key = frozenset({name_a, name_b})
+                    if pair_key in seen_pairs:
+                        continue
+                    dist = _levenshtein(name_a, name_b)
+                    # FP filter 4: similarity ratio gate.
+                    ratio = dist / max(len(name_a), len(name_b))
+                    if ratio > _MAX_SIMILARITY_RATIO:
+                        continue
+                    if dist <= 2:
+                        seen_pairs.add(pair_key)
+                        # Hard cap on findings.
+                        if len(findings) >= _MAX_FINDINGS:
+                            _log.debug(
+                                "refactor_completeness: findings capped at %d; "
+                                "tune threshold to see more",
+                                _MAX_FINDINGS,
+                            )
+                            break
+                        findings.append(
+                            build_finding(
+                                check_id="refactor.partial_rename_candidate",
+                                category=GateCategory.DRIFT,
+                                title=(
+                                    f"Possible partial rename: '{name_a}' vs '{name_b}'"
+                                ),
+                                severity=GateSeverity.MEDIUM,
+                                impact=GateImpact.WARN,
+                                summary=(
+                                    f"Name '{name_a}' in {path_a} and '{name_b}' in {path_b} "
+                                    f"differ by {dist} edit(s) — possible incomplete rename."
+                                ),
+                                recommendation=(
+                                    f"Unify naming: '{name_a}' vs '{name_b}' in "
+                                    f"{path_a} vs {path_b}. "
+                                    f"Decide the canonical name and propagate it to all call sites. "
+                                    f"If the similarity is intentional (overload, alias), add both "
+                                    f"names to the allowlist."
+                                ),
+                                evidence=[
+                                    EvidenceReference(
+                                        kind="file",
+                                        path=path_a,
+                                        detail=f"name '{name_a}'",
+                                    ),
+                                    EvidenceReference(
+                                        kind="file",
+                                        path=path_b,
+                                        detail=f"name '{name_b}'",
+                                    ),
+                                ],
+                                repair_kind=RepairKind.NORMALIZE_SHAPE.value,
+                                executor_action=(
+                                    f"Unify naming: '{name_a}' vs '{name_b}' in "
+                                    f"{path_a} vs {path_b}. "
+                                    f"Decide canonical name and propagate."
+                                ),
+                                proof_required=(
+                                    "grep for old name returns 0 matches; "
+                                    "all callers use canonical name"
+                                ),
+                                allowlist_allowed=True,
+                            )
+                        )
+    return build_check_result(
+        check_id="refactor_completeness",
+        category=GateCategory.DRIFT,
+        findings=findings,
+    )