PyPI - envgap - Versions diffs - 0.1.0__py3-none-any.whl - Mend

envgap 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

envgap/__init__.py +3 -0
envgap/checker.py +397 -0
envgap/cli.py +66 -0
envgap/extractors/__init__.py +2 -0
envgap/extractors/dotenv.py +75 -0
envgap/extractors/python_ast.py +120 -0
envgap/model/__init__.py +13 -0
envgap/model/env_source.py +29 -0
envgap/model/expected_var.py +25 -0
envgap/model/finding.py +25 -0
envgap/reporters/__init__.py +2 -0
envgap/reporters/json.py +67 -0
envgap/reporters/terminal.py +183 -0
envgap-0.1.0.dist-info/METADATA +319 -0
envgap-0.1.0.dist-info/RECORD +18 -0
envgap-0.1.0.dist-info/WHEEL +4 -0
envgap-0.1.0.dist-info/entry_points.txt +2 -0
envgap-0.1.0.dist-info/licenses/LICENSE +22 -0

envgap/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""envgap finds gaps in Python environment config."""
+__version__ = "0.1.0"

envgap/checker.py ADDED Viewed

@@ -0,0 +1,397 @@
+from __future__ import annotations
+import os
+from dataclasses import dataclass
+from collections.abc import Mapping
+from pathlib import Path
+from envgap.extractors.dotenv import parse_dotenv
+from envgap.extractors.python_ast import scan_python_env_usage
+from envgap.model import CodeUsage, EnvFile, ExpectedVar, Finding, Severity
+# Values that mark a variable as "not filled in yet". _is_placeholder compares
+# against this set after strip() and lower(), so entries must be lower-case;
+# the empty string makes whitespace-only values count as placeholders too.
+PLACEHOLDER_VALUES = {
+    "",
+    "<your-key-here>",
+    "changeme",
+    "change-me",
+    "example",
+    "insert-key-here",
+    "replace-me",
+    "todo",
+    "your-api-key",
+    "your-key",
+    "your-key-here",
+}
+# Lower-case name tokens mapped to the token they are treated as equal to when
+# _expand_tokens normalizes variable names for typo detection.
+ABBREVIATIONS = {
+    "db": "database",
+    "cfg": "config",
+    "conf": "config",
+    "pwd": "password",
+    "uri": "url",
+}
+@dataclass
+class CheckResult:
+    root: Path
+    env_path: Path
+    example_path: Path
+    env_file: EnvFile
+    example_file: EnvFile
+    shell_env: dict[str, str]
+    include_shell: bool
+    expected_keys: set[str]
+    code_usages: list[CodeUsage]
+    findings: list[Finding]
+    @property
+    def has_errors(self) -> bool:
+        return any(finding.severity == Severity.ERROR for finding in self.findings)
+    @property
+    def has_warnings(self) -> bool:
+        return any(finding.severity == Severity.WARNING for finding in self.findings)
+def run_check(
+    root: Path,
+    env_file: str = ".env",
+    example_file: str = ".env.example",
+    environ: Mapping[str, str] | None = None,
+    include_shell: bool = True,
+) -> CheckResult:
+    root = root.resolve()
+    env_path = root / env_file
+    example_path = root / example_file
+    actual = parse_dotenv(env_path)
+    example = parse_dotenv(example_path)
+    shell_env = dict(os.environ if environ is None else environ) if include_shell else {}
+    code_usages = scan_python_env_usage(root)
+    expected = _expected_vars(example, code_usages)
+    findings = _build_findings(actual, example, expected, code_usages, shell_env, include_shell)
+    return CheckResult(
+        root=root,
+        env_path=env_path,
+        example_path=example_path,
+        env_file=actual,
+        example_file=example,
+        shell_env=shell_env,
+        include_shell=include_shell,
+        expected_keys=set(expected),
+        code_usages=code_usages,
+        findings=findings,
+    )
+def _expected_vars(example: EnvFile, code_usages: list[CodeUsage]) -> dict[str, ExpectedVar]:
+    expected: dict[str, ExpectedVar] = {}
+    for var in example.vars:
+        expected.setdefault(var.key, ExpectedVar(key=var.key, documented_in=var.path))
+    for usage in code_usages:
+        expected.setdefault(usage.key, ExpectedVar(key=usage.key)).code_usages.append(usage)
+    return expected
+def _build_findings(
+    actual: EnvFile,
+    example: EnvFile,
+    expected: dict[str, ExpectedVar],
+    code_usages: list[CodeUsage],
+    shell_env: dict[str, str],
+    include_shell: bool,
+) -> list[Finding]:
+    """Derive every finding for one check run.
+
+    Args:
+        actual: Parsed dotenv file holding the local values.
+        example: Parsed example dotenv file.
+        expected: Expected variables keyed by name.
+        code_usages: Environment-variable usages found in Python code.
+        shell_env: Shell environment snapshot used for the shell notes.
+        include_shell: Whether the shell environment is taken into account.
+
+    Returns:
+        The findings sorted by severity value, code, key, path and line.
+    """
+    findings: list[Finding] = []
+    actual_values = actual.values
+    example_values = example.values
+    expected_keys = set(expected)
+    actual_keys = set(actual_values)
+    example_keys = set(example_values)
+    # Missing input files are reported as warnings; the checks below still run.
+    if not example.path.exists():
+        findings.append(
+            Finding(
+                code="missing_example_file",
+                severity=Severity.WARNING,
+                title=".env.example was not found",
+                message="envgap could not find a documented source of expected variables.",
+                path=example.path,
+                suggestion="Add a .env.example file with every environment variable your app expects.",
+            )
+        )
+    if not actual.path.exists():
+        findings.append(
+            Finding(
+                code="missing_env_file",
+                severity=Severity.WARNING,
+                title=".env was not found",
+                message="envgap could not compare local values because .env is missing.",
+                path=actual.path,
+                suggestion="Create .env from .env.example, or pass --env-file for a different file.",
+            )
+        )
+    findings.extend(_duplicate_findings(actual))
+    findings.extend(_duplicate_findings(example))
+    # Expected keys that the dotenv file does not define.
+    for key in sorted(expected_keys - actual_keys):
+        expected_var = expected[key]
+        # Keys that are neither required nor documented are not reported.
+        if not expected_var.required and not expected_var.documented_in:
+            continue
+        usage = _first_required_usage(expected_var.code_usages)
+        findings.append(
+            Finding(
+                code="missing_key",
+                # NOTE(review): given the guard above, this condition looks
+                # always true, so the WARNING branch appears unreachable -
+                # confirm the intended severity for optional keys.
+                severity=Severity.ERROR if expected_var.required or expected_var.documented_in else Severity.WARNING,
+                title=f"{key} is missing from .env",
+                message=_missing_message(key, expected_var, shell_env, include_shell),
+                key=key,
+                path=usage.path if usage else expected_var.documented_in,
+                line=usage.line if usage else None,
+                suggestion=_missing_suggestion(key, shell_env, include_shell),
+                details=_checked_details(key, actual, example, shell_env, include_shell) + _usage_details(expected_var.code_usages),
+            )
+        )
+    # Keys defined in the dotenv file that nothing expects.
+    for key in sorted(actual_keys - expected_keys):
+        findings.append(
+            Finding(
+                code="undocumented_key",
+                severity=Severity.WARNING,
+                title=f"{key} is present but undocumented",
+                message=f"{key} exists in .env but is not in .env.example and was not found in Python env usage.",
+                key=key,
+                path=actual_values[key].path,
+                line=actual_values[key].line,
+                suggestion=f"Add {key} to .env.example, or remove it from .env if it is unused.",
+            )
+        )
+    # Empty and placeholder values; these are errors only for expected keys.
+    for key, var in sorted(actual_values.items()):
+        if var.value == "":
+            findings.append(
+                Finding(
+                    code="empty_value",
+                    severity=Severity.ERROR if key in expected_keys else Severity.WARNING,
+                    title=f"{key} is empty",
+                    message=f"{key} is defined in .env but has no value.",
+                    key=key,
+                    path=var.path,
+                    line=var.line,
+                    suggestion=f"Set a value for {key}, or remove it if the app should use a default.",
+                )
+            )
+        elif _is_placeholder(var.value):
+            findings.append(
+                Finding(
+                    code="placeholder_value",
+                    severity=Severity.ERROR if key in expected_keys else Severity.WARNING,
+                    title=f"{key} still looks like a placeholder",
+                    message=f"{key} is set to {_mask_value(key, var.value)}, which does not look like a real value.",
+                    key=key,
+                    path=var.path,
+                    line=var.line,
+                    suggestion=f"Replace {key} with the real value for this environment.",
+                )
+            )
+    # Keys that code requires but the example file does not document.
+    for key in sorted(_required_code_keys(code_usages) - example_keys):
+        # A match always exists: key comes from the required usages themselves.
+        usage = next(usage for usage in code_usages if usage.key == key and usage.required)
+        findings.append(
+            Finding(
+                code="code_missing_from_example",
+                severity=Severity.ERROR,
+                title=f"{key} is used in code but missing from .env.example",
+                message=f"{key} is required by {usage.source} but is not documented in .env.example.",
+                key=key,
+                path=usage.path,
+                line=usage.line,
+                suggestion=f"Add {key}=... to .env.example so local dev and CI know it is required.",
+            )
+        )
+    findings.extend(_typo_findings(actual_keys, expected_keys, actual))
+    findings.extend(_parse_warning_findings(actual))
+    findings.extend(_parse_warning_findings(example))
+    # Missing key, path and line sort as "", "" and 0 respectively.
+    return sorted(findings, key=lambda f: (f.severity.value, f.code, f.key or "", str(f.path or ""), f.line or 0))
+def _duplicate_findings(env_file: EnvFile) -> list[Finding]:
+    findings: list[Finding] = []
+    for key, vars_ in sorted(env_file.duplicates.items()):
+        lines = ", ".join(str(var.line) for var in vars_)
+        findings.append(
+            Finding(
+                code="duplicate_key",
+                severity=Severity.ERROR,
+                title=f"{key} is duplicated in {env_file.path.name}",
+                message=f"{key} appears more than once in {env_file.path.name} on lines {lines}. The last value wins in many loaders.",
+                key=key,
+                path=env_file.path,
+                line=vars_[0].line,
+                suggestion=f"Keep one {key} entry in {env_file.path.name}.",
+            )
+        )
+    return findings
+def _typo_findings(actual_keys: set[str], expected_keys: set[str], actual: EnvFile) -> list[Finding]:
+    findings: list[Finding] = []
+    for actual_key in sorted(actual_keys - expected_keys):
+        for expected_key in sorted(expected_keys - actual_keys):
+            if _similar(actual_key, expected_key):
+                var = actual.values[actual_key]
+                findings.append(
+                    Finding(
+                        code="possible_typo",
+                        severity=Severity.WARNING,
+                        title=f"{actual_key} may be a typo for {expected_key}",
+                        message=f".env contains {actual_key}, but the expected variable is {expected_key}.",
+                        key=actual_key,
+                        path=var.path,
+                        line=var.line,
+                        suggestion=f"Rename {actual_key} to {expected_key} if they represent the same setting.",
+                    )
+                )
+    return findings
+def _parse_warning_findings(env_file: EnvFile) -> list[Finding]:
+    return [
+        Finding(
+            code="parse_warning",
+            severity=Severity.WARNING,
+            title="Could not parse dotenv line",
+            message=warning,
+            path=env_file.path,
+        )
+        for warning in env_file.parse_warnings
+    ]
+def _first_required_usage(usages: list[CodeUsage]) -> CodeUsage | None:
+    return next((usage for usage in usages if usage.required), usages[0] if usages else None)
+def _required_code_keys(usages: list[CodeUsage]) -> set[str]:
+    return {usage.key for usage in usages if usage.required}
+def _missing_message(key: str, expected_var: ExpectedVar, shell_env: dict[str, str], include_shell: bool) -> str:
+    required_usage = _first_required_usage(expected_var.code_usages)
+    shell_note = ""
+    if include_shell and key in shell_env:
+        shell_note = " It is present in your shell environment, so local commands may work while CI or Docker still fails."
+    if required_usage:
+        return f"{key} is required by {required_usage.source} in {required_usage.path.name}:{required_usage.line} but was not found in .env.{shell_note}"
+    if expected_var.documented_in:
+        return f"{key} is documented in {expected_var.documented_in.name} but was not found in .env.{shell_note}"
+    return f"{key} is expected but was not found in .env.{shell_note}"
+def _missing_suggestion(key: str, shell_env: dict[str, str], include_shell: bool) -> str:
+    if include_shell and key in shell_env:
+        return f"Add {key}=... to .env or document how CI/Docker should provide it."
+    return f"Add {key}=... to .env."
+def _checked_details(
+    key: str,
+    actual: EnvFile,
+    example: EnvFile,
+    shell_env: dict[str, str],
+    include_shell: bool,
+) -> list[str]:
+    return [
+        f"shell environment: {_shell_status(key, shell_env, include_shell)}",
+        f".env: {_env_file_status(key, actual)}",
+        f".env.example: {_env_file_status(key, example)}",
+    ]
+def _shell_status(key: str, shell_env: dict[str, str], include_shell: bool) -> str:
+    if not include_shell:
+        return "ignored"
+    return "found" if key in shell_env else "not found"
+def _env_file_status(key: str, env_file: EnvFile) -> str:
+    if not env_file.path.exists():
+        return "file not found"
+    if key not in env_file.values:
+        return "not found"
+    value = env_file.values[key].value
+    if value == "":
+        return "found empty"
+    if _is_placeholder(value):
+        return "found placeholder"
+    return "found"
+def _usage_details(usages: list[CodeUsage]) -> list[str]:
+    return [
+        f"{usage.path}:{usage.line}: {usage.source} ({'required' if usage.required else 'optional'})"
+        for usage in usages
+    ]
+def _is_placeholder(value: str) -> bool:
+    normalized = value.strip().lower()
+    if normalized in PLACEHOLDER_VALUES:
+        return True
+    return "your-" in normalized or normalized.startswith("<") and normalized.endswith(">")
+def _mask_value(key: str, value: str) -> str:
+    if _secret_like(key) or len(value) > 12:
+        return value[:2] + "***" + value[-2:] if len(value) > 4 else "***"
+    return repr(value)
+def _secret_like(key: str) -> bool:
+    lowered = key.lower()
+    return any(part in lowered for part in ("secret", "token", "password", "passwd", "api_key", "apikey", "key"))
+def _similar(left: str, right: str) -> bool:
+    if left == right:
+        return False
+    if left.replace("_", "") == right.replace("_", ""):
+        return True
+    if _expand_tokens(left) == _expand_tokens(right):
+        return True
+    if _token_acronym_match(left, right) or _token_acronym_match(right, left):
+        return True
+    if left.endswith(right) or right.endswith(left):
+        return True
+    return _levenshtein(left, right) <= max(2, min(len(left), len(right)) // 4)
+def _expand_tokens(value: str) -> list[str]:
+    return [ABBREVIATIONS.get(part.lower(), part.lower()) for part in value.split("_")]
+def _token_acronym_match(short: str, long: str) -> bool:
+    short_parts = short.split("_")
+    long_parts = long.split("_")
+    if len(short_parts) != len(long_parts):
+        return False
+    return all(
+        short_part == long_part or long_part.startswith(short_part)
+        for short_part, long_part in zip(short_parts, long_parts)
+    )
+def _levenshtein(left: str, right: str) -> int:
+    previous = list(range(len(right) + 1))
+    for i, left_char in enumerate(left, start=1):
+        current = [i]
+        for j, right_char in enumerate(right, start=1):
+            insert = current[j - 1] + 1
+            delete = previous[j] + 1
+            replace = previous[j - 1] + (left_char != right_char)
+            current.append(min(insert, delete, replace))
+        previous = current
+    return previous[-1]

envgap/cli.py ADDED Viewed

@@ -0,0 +1,66 @@
+from __future__ import annotations
+import argparse
+from pathlib import Path
+from envgap import __version__
+from envgap.checker import run_check
+from envgap.reporters.json import render_json
+from envgap.reporters.terminal import render_terminal
+def main(argv: list[str] | None = None) -> int:
+    parser = _build_parser()
+    args = parser.parse_args(argv)
+    if args.command == "check":
+        result = run_check(
+            Path(args.path),
+            env_file=args.env_file,
+            example_file=args.example_file,
+            include_shell=not args.no_shell,
+        )
+        strict = args.strict or args.ci
+        output = render_json(result) if args.format == "json" else render_terminal(result, strict=strict)
+        print(output)
+        if result.has_errors:
+            return 1
+        if strict and result.has_warnings:
+            return 1
+        return 0
+    parser.print_help()
+    return 0
+def _build_parser() -> argparse.ArgumentParser:
+    parser = argparse.ArgumentParser(
+        prog="envgap",
+        description="Find the gaps in your Python environment config.",
+        epilog="Start with: envgap check",
+    )
+    parser.add_argument("--version", action="version", version=f"%(prog)s {__version__}")
+    subparsers = parser.add_subparsers(dest="command")
+    check = subparsers.add_parser(
+        "check",
+        help="diagnose .env drift and Python environment variable usage",
+        description="Compare shell env, .env, .env.example, and Python code to explain config drift.",
+    )
+    check.add_argument("path", nargs="?", default=".", help="project directory to inspect (default: current directory)")
+    check.add_argument("--env-file", default=".env", help="dotenv file to compare, relative to PATH (default: .env)")
+    check.add_argument(
+        "--example-file",
+        default=".env.example",
+        help="documented dotenv example file, relative to PATH (default: .env.example)",
+    )
+    check.add_argument("--no-shell", action="store_true", help="ignore the current shell environment for deterministic checks")
+    check.add_argument("--format", choices=["terminal", "json"], default="terminal", help="output format (default: terminal)")
+    check.add_argument("--json", action="store_const", const="json", dest="format", help="shortcut for --format json")
+    check.add_argument("--strict", action="store_true", help="fail on warnings as well as errors")
+    check.add_argument("--ci", action="store_true", help="CI-friendly alias for --strict")
+    return parser
+# When run as a script, exit with the status code returned by main().
+if __name__ == "__main__":
+    raise SystemExit(main())

envgap/extractors/__init__.py ADDED Viewed

@@ -0,0 +1,2 @@
+"""Extract expected and actual environment variables from project files."""
+

envgap/extractors/dotenv.py ADDED Viewed

@@ -0,0 +1,75 @@
+from __future__ import annotations
+import re
+from pathlib import Path
+from envgap.model import EnvFile, EnvVar
+# Valid variable names: ASCII letters, digits and underscores, not starting
+# with a digit.
+KEY_RE = re.compile(r"^[A-Za-z_][A-Za-z0-9_]*$")
+def parse_dotenv(path: Path) -> EnvFile:
+    env_file = EnvFile(path=path)
+    seen: dict[str, list[EnvVar]] = {}
+    if not path.exists():
+        return env_file
+    for line_number, raw_line in enumerate(path.read_text(encoding="utf-8").splitlines(), start=1):
+        parsed = _parse_line(raw_line)
+        if parsed is None:
+            continue
+        key, value = parsed
+        if not KEY_RE.match(key):
+            env_file.parse_warnings.append(f"{path}:{line_number}: skipped invalid key {key!r}")
+            continue
+        var = EnvVar(key=key, value=value, path=path, line=line_number, raw=raw_line)
+        env_file.vars.append(var)
+        seen.setdefault(key, []).append(var)
+    env_file.duplicates = {key: vars_ for key, vars_ in seen.items() if len(vars_) > 1}
+    return env_file
+def _parse_line(line: str) -> tuple[str, str] | None:
+    stripped = line.strip()
+    if not stripped or stripped.startswith("#"):
+        return None
+    if stripped.startswith("export "):
+        stripped = stripped[len("export ") :].lstrip()
+    if "=" not in stripped:
+        return None
+    key, value = stripped.split("=", 1)
+    key = key.strip()
+    value = _strip_inline_comment(value.strip())
+    return key, _unquote(value)
+def _strip_inline_comment(value: str) -> str:
+    quote: str | None = None
+    escaped = False
+    for index, char in enumerate(value):
+        if escaped:
+            escaped = False
+            continue
+        if char == "\\":
+            escaped = True
+            continue
+        if char in {"'", '"'}:
+            quote = None if quote == char else char if quote is None else quote
+            continue
+        if char == "#" and quote is None and (index == 0 or value[index - 1].isspace()):
+            return value[:index].rstrip()
+    return value
+def _unquote(value: str) -> str:
+    if len(value) >= 2 and value[0] == value[-1] and value[0] in {"'", '"'}:
+        return value[1:-1]
+    return value

envgap/extractors/python_ast.py ADDED Viewed

@@ -0,0 +1,120 @@
+from __future__ import annotations
+import ast
+from pathlib import Path
+from envgap.model import CodeUsage
+# Path components that exclude a Python file from the scan: find_python_files
+# drops any file whose path relative to the root contains one of these names.
+SKIP_DIRS = {
+    ".git",
+    ".hg",
+    ".mypy_cache",
+    ".pytest_cache",
+    ".ruff_cache",
+    ".tox",
+    ".venv",
+    "__pycache__",
+    "build",
+    "dist",
+    "node_modules",
+    "venv",
+}
+def find_python_files(root: Path) -> list[Path]:
+    return sorted(
+        path
+        for path in root.rglob("*.py")
+        if not any(part in SKIP_DIRS for part in path.relative_to(root).parts)
+    )
+def scan_python_env_usage(root: Path) -> list[CodeUsage]:
+    usages: list[CodeUsage] = []
+    for path in find_python_files(root):
+        try:
+            tree = ast.parse(path.read_text(encoding="utf-8"), filename=str(path))
+        except (SyntaxError, UnicodeDecodeError):
+            continue
+        visitor = _EnvVisitor(path)
+        visitor.visit(tree)
+        usages.extend(visitor.usages)
+    return sorted(usages, key=lambda usage: (str(usage.path), usage.line, usage.key))
+class _EnvVisitor(ast.NodeVisitor):
+    def __init__(self, path: Path) -> None:
+        self.path = path
+        self.usages: list[CodeUsage] = []
+    def visit_Subscript(self, node: ast.Subscript) -> None:
+        if _is_os_environ(node.value):
+            key = _string_literal(node.slice)
+            if key:
+                self.usages.append(
+                    CodeUsage(
+                        key=key,
+                        path=self.path,
+                        line=node.lineno,
+                        required=True,
+                        source=f'os.environ["{key}"]',
+                    )
+                )
+        self.generic_visit(node)
+    def visit_Call(self, node: ast.Call) -> None:
+        key = None
+        source = None
+        if _is_os_getenv(node.func):
+            key = _first_string_arg(node)
+            source = f'os.getenv("{key}")' if key else "os.getenv"
+        elif _is_os_environ_get(node.func):
+            key = _first_string_arg(node)
+            source = f'os.environ.get("{key}")' if key else "os.environ.get"
+        if key and source:
+            required = len(node.args) == 1 and not any(kw.arg == "default" for kw in node.keywords)
+            self.usages.append(
+                CodeUsage(
+                    key=key,
+                    path=self.path,
+                    line=node.lineno,
+                    required=required,
+                    source=source,
+                )
+            )
+        self.generic_visit(node)
+def _is_os_environ(node: ast.AST) -> bool:
+    return (
+        isinstance(node, ast.Attribute)
+        and node.attr == "environ"
+        and isinstance(node.value, ast.Name)
+        and node.value.id == "os"
+    )
+def _is_os_getenv(node: ast.AST) -> bool:
+    return (
+        isinstance(node, ast.Attribute)
+        and node.attr == "getenv"
+        and isinstance(node.value, ast.Name)
+        and node.value.id == "os"
+    )
+def _is_os_environ_get(node: ast.AST) -> bool:
+    return isinstance(node, ast.Attribute) and node.attr == "get" and _is_os_environ(node.value)
+def _first_string_arg(node: ast.Call) -> str | None:
+    if not node.args:
+        return None
+    return _string_literal(node.args[0])
+def _string_literal(node: ast.AST) -> str | None:
+    if isinstance(node, ast.Constant) and isinstance(node.value, str):
+        return node.value
+    return None

envgap/model/__init__.py ADDED Viewed

@@ -0,0 +1,13 @@
+from envgap.model.env_source import EnvFile, EnvVar
+from envgap.model.expected_var import CodeUsage, ExpectedVar
+from envgap.model.finding import Finding, Severity
+# Names re-exported from the model submodules imported above.
+__all__ = [
+    "CodeUsage",
+    "EnvFile",
+    "EnvVar",
+    "ExpectedVar",
+    "Finding",
+    "Severity",
+]