PyPI - trustrender - Versions diffs - 0.1.0__py3-none-any.whl - Mend

trustrender 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34) hide show

trustrender/__init__.py +607 -0
trustrender/cli.py +783 -0
trustrender/contract.py +767 -0
trustrender/dashboard.py +371 -0
trustrender/doctor.py +363 -0
trustrender/engine.py +364 -0
trustrender/errors.py +112 -0
trustrender/filters.py +57 -0
trustrender/fingerprint.py +700 -0
trustrender/fonts/Inter/Inter-Bold.ttf +0 -0
trustrender/fonts/Inter/Inter-BoldItalic.ttf +0 -0
trustrender/fonts/Inter/Inter-Italic.ttf +0 -0
trustrender/fonts/Inter/Inter-Regular.ttf +0 -0
trustrender/fonts/Inter/LICENSE.txt +92 -0
trustrender/playground/assets/index-NINB-pNr.js +31 -0
trustrender/playground/assets/index-V6TpJlAv.css +2 -0
trustrender/playground/assets/pdf.worker-C1breYqn.mjs +56901 -0
trustrender/playground/favicon.svg +14 -0
trustrender/playground/icons.svg +24 -0
trustrender/playground/index.html +17 -0
trustrender/provenance.py +257 -0
trustrender/readiness.py +659 -0
trustrender/regression.py +580 -0
trustrender/semantic.py +688 -0
trustrender/server.py +577 -0
trustrender/templates.py +149 -0
trustrender/trace.py +321 -0
trustrender/zugferd.py +565 -0
trustrender-0.1.0.dist-info/METADATA +262 -0
trustrender-0.1.0.dist-info/RECORD +34 -0
trustrender-0.1.0.dist-info/WHEEL +5 -0
trustrender-0.1.0.dist-info/entry_points.txt +2 -0
trustrender-0.1.0.dist-info/licenses/LICENSE +21 -0
trustrender-0.1.0.dist-info/top_level.txt +1 -0

trustrender/__init__.py ADDED Viewed

@@ -0,0 +1,607 @@
+"""TrustRender: fast, code-first PDF generation from structured data."""
+from __future__ import annotations
+import json
+import os
+from dataclasses import dataclass
+from pathlib import Path
+from .engine import CompileBackend, compile_typst, compile_typst_file
+from .errors import ErrorCode, TrustRenderError
+@dataclass
+class RenderResult:
+    """Internal result from the render pipeline. Not part of the public API."""
+    # PDF contents as returned by the pipeline after its last stage.
+    pdf_bytes: bytes
+    # Identifier of the trace built for the render; None when not supplied.
+    trace_id: str | None = None
+# Re-export for public API
+from .errors import ErrorCode as ErrorCode  # noqa: F811
+from .templates import render_template
+__version__ = "0.1.0"
+__all__ = [
+    "render", "audit", "AuditResult",
+    "TrustRenderError", "ErrorCode", "__version__", "bundled_font_dir",
+]
+# Resolved once at import time — deterministic across local, test, and container.
+# Check multiple locations: env var, installed package, dev layout.
+def _find_bundled_fonts() -> Path | None:
+    """Find bundled font directory. Checked once at import time."""
+    # 1. Environment variable (explicit override, used in containers)
+    env_path = os.environ.get("TRUSTRENDER_FONT_PATH")
+    if env_path:
+        p = Path(env_path)
+        if p.is_dir():
+            return p.resolve()
+    # 2. Installed package: fonts/ inside the trustrender package directory
+    pkg_path = Path(__file__).resolve().parent / "fonts"
+    if pkg_path.is_dir():
+        return pkg_path
+    # 3. Development layout: src/trustrender/__init__.py -> ../../fonts/
+    dev_path = Path(__file__).resolve().parent.parent.parent / "fonts"
+    if dev_path.is_dir():
+        return dev_path
+    return None
+# Computed a single time when this module is imported; later changes to the
+# environment or the filesystem are not picked up.
+_BUNDLED_FONT_DIR = _find_bundled_fonts()
+def bundled_font_dir() -> Path | None:
+    """Return the path to the bundled font directory, or None if not found.
+    The value is the one cached in ``_BUNDLED_FONT_DIR``; no filesystem
+    access happens on this call.
+    """
+    return _BUNDLED_FONT_DIR
+def _build_font_paths(
+    font_paths: list[str | os.PathLike] | None,
+) -> list[str] | None:
+    """Build the final font_paths list.
+    Font precedence:
+      1. Explicit font_paths passed by caller
+      2. Bundled font directory (``fonts/`` in the package)
+      3. System fonts (Typst default behavior — always included)
+    Caller paths extend the bundled defaults.
+    """
+    result: list[str] = []
+    if font_paths:
+        result.extend(str(p) for p in font_paths)
+    bundled = bundled_font_dir()
+    if bundled:
+        bundled_str = str(bundled)
+        if bundled_str not in result:
+            result.append(bundled_str)
+    return result or None
+def _render_document_pipeline(
+    template_path: Path,
+    data: dict,
+    *,
+    debug: bool = False,
+    font_paths: list[str] | None = None,
+    validate: bool = True,
+    zugferd: str | None = None,
+    provenance: bool = False,
+    backend: CompileBackend | None = None,
+    timeout: float | None = None,
+    display_name: str | None = None,
+) -> RenderResult:
+    """Shared render pipeline: validate, preprocess, compile, post-process.
+    All inputs must be pre-resolved (paths exist, data is a dict, fonts are
+    string paths).  This is the single source of truth for render semantics —
+    both ``render()`` and the server call this.
+    Pipeline stages (in order):
+      1. ZUGFeRD data validation (EN 16931 requirements)
+      2. Contract validation (opt-in, Jinja2 templates only)
+      3. Template preprocessing (Jinja2) + Typst compilation
+      4. ZUGFeRD post-processing (XML build + PDF embed)
+      5. Provenance embedding (after all other processing)
+    The ordering of stages 4 and 5 is load-bearing: provenance uses
+    clone_from to preserve ZUGFeRD metadata and embedded files.
+    If ``TRUSTRENDER_HISTORY`` is set, a stage-by-stage RenderTrace is
+    recorded to the trace store after each render (success or failure).
+    """
+    import hashlib
+    import time
+    from .trace import RenderTrace, StageTrace, get_store
+    is_jinja = template_path.name.endswith(".j2.typ")
+    trace = RenderTrace(
+        template_name=display_name or template_path.name,
+        template_hash=f"sha256:{hashlib.sha256(template_path.read_bytes()).hexdigest()[:16]}",
+        data_hash=f"sha256:{hashlib.sha256(json.dumps(data, sort_keys=True, separators=(',',':')).encode()).hexdigest()[:16]}",
+        engine_version=__version__,
+        zugferd_profile=zugferd or "",
+        validated=validate,
+    )
+    pipeline_start = time.monotonic()
+    def _record_trace(outcome: str, pdf_size: int = 0, error: TrustRenderError | None = None) -> None:
+        trace.outcome = outcome
+        trace.pdf_size = pdf_size
+        trace.total_ms = int((time.monotonic() - pipeline_start) * 1000)
+        if error:
+            trace.error_code = error.code.value
+            trace.error_stage = error.stage
+            trace.error_message = str(error).split("\n")[0]
+        store = get_store()
+        if store:
+            try:
+                store.record(trace)
+            except Exception:
+                pass  # Lineage is observability, not a gate
+    try:
+        # 1. ZUGFeRD invoice data validation
+        if zugferd:
+            from .zugferd import validate_zugferd_invoice_data
+            t0 = time.monotonic()
+            errors = validate_zugferd_invoice_data(data, profile=zugferd)
+            stage = StageTrace(
+                stage="zugferd_validation",
+                status="fail" if errors else "pass",
+                duration_ms=int((time.monotonic() - t0) * 1000),
+                checks_run=len(errors) + (1 if not errors else 0),
+                checks_passed=0 if errors else 1,
+                checks_failed=len(errors),
+                errors=[{"path": e.path, "message": e.message} for e in errors],
+                metadata={"profile": zugferd},
+            )
+            trace.stages.append(stage)
+            if errors:
+                detail = "\n".join(f"  {e.path}: {e.message}" for e in errors)
+                exc = TrustRenderError(
+                    f"Invoice data does not satisfy EN 16931: {len(errors)} error(s)",
+                    code=ErrorCode.ZUGFERD_ERROR,
+                    stage="zugferd_validation",
+                    detail=detail,
+                    template_path=str(template_path),
+                    validation_errors=errors,
+                )
+                _record_trace("error", error=exc)
+                raise exc
+        # 2. Contract validation (opt-in, Jinja2 templates only)
+        if validate and is_jinja:
+            from .contract import (
+                format_contract_detail,
+                format_contract_errors,
+                infer_contract,
+                validate_data,
+            )
+            t0 = time.monotonic()
+            contract = infer_contract(template_path)
+            validation_errors = validate_data(contract, data)
+            stage = StageTrace(
+                stage="contract_validation",
+                status="fail" if validation_errors else "pass",
+                duration_ms=int((time.monotonic() - t0) * 1000),
+                checks_run=len(contract),
+                checks_passed=len(contract) - len(validation_errors),
+                checks_failed=len(validation_errors),
+                errors=[{"path": e.path, "message": e.message} for e in validation_errors],
+            )
+            trace.stages.append(stage)
+            if validation_errors:
+                exc = TrustRenderError(
+                    format_contract_errors(validation_errors, template_path.name),
+                    code=ErrorCode.DATA_CONTRACT,
+                    stage="data_validation",
+                    template_path=str(template_path),
+                    detail=format_contract_detail(validation_errors, contract),
+                )
+                _record_trace("error", error=exc)
+                raise exc
+        # 3. Template preprocessing + compilation
+        t0 = time.monotonic()
+        pdf_standards = ["a-3b"] if zugferd else None
+        if is_jinja:
+            rendered = render_template(template_path, data)
+            pdf_bytes = compile_typst(
+                rendered,
+                template_path.parent,
+                debug=debug,
+                font_paths=font_paths,
+                template_path=template_path,
+                backend=backend,
+                timeout=timeout,
+                pdf_standards=pdf_standards,
+            )
+        else:
+            pdf_bytes = compile_typst_file(
+                template_path,
+                font_paths=font_paths,
+                backend=backend,
+                timeout=timeout,
+                pdf_standards=pdf_standards,
+            )
+        trace.stages.append(StageTrace(
+            stage="compilation",
+            status="pass",
+            duration_ms=int((time.monotonic() - t0) * 1000),
+            metadata={
+                "template_type": "jinja2" if is_jinja else "raw",
+                "pdf_standards": pdf_standards or [],
+                "pdf_size": len(pdf_bytes),
+            },
+        ))
+        # 4. ZUGFeRD post-processing
+        if zugferd:
+            from .zugferd import apply_zugferd, build_invoice_xml
+            t0 = time.monotonic()
+            try:
+                xml_bytes = build_invoice_xml(data, profile=zugferd)
+                # XSD + Schematron validation: guard rail before embedding XML
+                from .zugferd import validate_zugferd_xml
+                xml_errors = validate_zugferd_xml(xml_bytes)
+                if xml_errors:
+                    raise TrustRenderError(
+                        f"Generated XML failed validation: {xml_errors[0]}",
+                        code=ErrorCode.ZUGFERD_ERROR,
+                        stage="zugferd",
+                        detail="; ".join(xml_errors),
+                        template_path=str(template_path),
+                    )
+                pdf_bytes = apply_zugferd(pdf_bytes, xml_bytes)
+                trace.stages.append(StageTrace(
+                    stage="zugferd_postprocess",
+                    status="pass",
+                    duration_ms=int((time.monotonic() - t0) * 1000),
+                    metadata={"xml_size": len(xml_bytes), "profile": zugferd},
+                ))
+            except TrustRenderError:
+                raise
+            except Exception as exc:
+                raise TrustRenderError(
+                    f"ZUGFeRD generation failed: {exc}",
+                    code=ErrorCode.ZUGFERD_ERROR,
+                    stage="zugferd",
+                    detail=str(exc),
+                    template_path=str(template_path),
+                ) from exc
+        # 5. Provenance (AFTER ZUGFeRD — uses clone_from to preserve metadata)
+        if provenance:
+            from .provenance import create_provenance, embed_provenance
+            t0 = time.monotonic()
+            prov_record = create_provenance(template_path, data)
+            pdf_bytes = embed_provenance(pdf_bytes, prov_record)
+            trace.stages.append(StageTrace(
+                stage="provenance",
+                status="pass",
+                duration_ms=int((time.monotonic() - t0) * 1000),
+                metadata={"proof_hash": prov_record.proof[:30]},
+            ))
+            trace.provenance_hash = prov_record.proof
+        # Output fingerprint: hash the final PDF bytes after all post-processing
+        trace.output_hash = f"sha256:{hashlib.sha256(pdf_bytes).hexdigest()[:16]}"
+        _record_trace("success", pdf_size=len(pdf_bytes))
+        return RenderResult(pdf_bytes=pdf_bytes, trace_id=trace.id)
+    except TrustRenderError as exc:
+        if not trace.outcome:  # Not already recorded by a stage
+            _record_trace("error", error=exc)
+        raise
+def render(
+    template: str | os.PathLike,
+    data: dict | str | os.PathLike,
+    *,
+    output: str | os.PathLike | None = None,
+    debug: bool = False,
+    font_paths: list[str | os.PathLike] | None = None,
+    validate: bool = True,
+    zugferd: str | None = None,
+    provenance: bool = False,
+) -> bytes:
+    """Render a PDF from a template and data.
+    Args:
+        template: Path to a template file.
+            - ``.j2.typ``: Jinja2 template preprocessed then compiled with Typst.
+            - ``.typ``: Raw Typst file compiled directly.
+        data: Template data as a dict, a JSON string, or a path to a ``.json`` file.
+        output: If provided, write the PDF to this path.
+        debug: If True, preserve the intermediate ``.typ`` file after rendering.
+            On error, the intermediate file is always preserved regardless of this flag.
+        font_paths: Additional font directories.  These are prepended to the
+            bundled font directory.
+        validate: If True, validate data against the template's inferred
+            structural contract before rendering.  Raises ``TrustRenderError``
+            with code ``DATA_CONTRACT`` if validation fails.
+        zugferd: If set to ``"en16931"``, generate a ZUGFeRD-compliant
+            PDF/A-3b with embedded CII XML.  Validates invoice data against
+            EN 16931 requirements before generation.
+        provenance: If True, embed a cryptographic generation proof in the
+            PDF metadata.  Records template hash, data hash, engine version,
+            and timestamp.  Use ``verify_provenance()`` to verify later.
+    Returns:
+        PDF file contents as bytes.
+    Raises:
+        TrustRenderError: If rendering fails. Check ``code`` for the error category,
+            ``stage`` for where it failed, and ``detail`` for the full diagnostic.
+        FileNotFoundError: If the template or data file does not exist.
+    """
+    _SUPPORTED_ZUGFERD = {"en16931"}
+    if zugferd is not None and zugferd not in _SUPPORTED_ZUGFERD:
+        raise TrustRenderError(
+            f"Unsupported zugferd profile: '{zugferd}'. Supported: {sorted(_SUPPORTED_ZUGFERD)}",
+            code=ErrorCode.INVALID_DATA,
+            stage="data_resolution",
+        )
+    template_path = Path(template)
+    if not template_path.exists():
+        raise TrustRenderError(
+            f"Template not found: {template_path}",
+            code=ErrorCode.TEMPLATE_NOT_FOUND,
+            stage="data_resolution",
+            template_path=str(template_path),
+        )
+    data_dict = _resolve_data(data)
+    resolved_fonts = _build_font_paths(font_paths)
+    result = _render_document_pipeline(
+        template_path,
+        data_dict,
+        debug=debug,
+        font_paths=resolved_fonts,
+        validate=validate,
+        zugferd=zugferd,
+        provenance=provenance,
+    )
+    if output is not None:
+        output_path = Path(output)
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_bytes(result.pdf_bytes)
+    return result.pdf_bytes
+@dataclass
+class AuditResult:
+    """Result of an audited render: PDF bytes plus audit artifacts.
+    The ``fingerprint`` is always present.  The ``change_set`` and
+    ``drift_result`` are only present when a ``baseline_dir`` is provided
+    and a baseline exists for the template.  The ``semantic_report`` is only
+    present when semantic hints were passed to ``audit()``.
+    """
+    # Final PDF contents produced by the render.
+    pdf_bytes: bytes
+    # Typed as ``object`` so the audit modules are not imported at module
+    # level; the trailing comments name the concrete types.
+    fingerprint: object  # InputFingerprint (avoid import at module level)
+    change_set: object | None = None  # ChangeSet | None
+    drift_result: object | None = None  # DriftResult | None
+    semantic_report: object | None = None  # SemanticReport | None
+def audit(
+    template: str | os.PathLike,
+    data: dict | str | os.PathLike,
+    *,
+    output: str | os.PathLike | None = None,
+    debug: bool = False,
+    font_paths: list[str | os.PathLike] | None = None,
+    validate: bool = True,
+    zugferd: str | None = None,
+    provenance: bool = False,
+    baseline_dir: str | os.PathLike | None = None,
+    save_baseline: bool = False,
+    semantic_hints: object | None = None,
+) -> AuditResult:
+    """Render with full audit: fingerprint, drift detection, semantic checks.
+    This is a superset of ``render()`` that also computes an input
+    fingerprint, optionally compares against a stored baseline, and
+    optionally runs semantic validation.
+    Args:
+        template: Path to a template file.
+        data: Template data (dict, JSON string, or path to .json).
+        output: If provided, write the PDF to this path.
+        debug: Preserve intermediate files.
+        font_paths: Additional font directories.
+        validate: Run structural contract validation.
+        zugferd: ZUGFeRD profile (``"en16931"``).
+        provenance: Embed generation proof.
+        baseline_dir: Root directory for baselines. If provided and a
+            baseline exists, drift checks are run. If None, only
+            fingerprinting happens.
+        save_baseline: If True, save the current render as the new
+            baseline (requires ``baseline_dir``).
+        semantic_hints: SemanticHints instance for semantic validation.
+            If None, semantic checks are skipped.
+    Returns:
+        AuditResult with PDF bytes and all audit artifacts.
+    """
+    import time
+    from .fingerprint import InputFingerprint, compare, compute_fingerprint
+    from .regression import check_drift, save_baseline as _save_baseline
+    from .semantic import SemanticReport, validate_semantics
+    _SUPPORTED_ZUGFERD = {"en16931"}
+    if zugferd is not None and zugferd not in _SUPPORTED_ZUGFERD:
+        raise TrustRenderError(
+            f"Unsupported zugferd profile: '{zugferd}'. Supported: {sorted(_SUPPORTED_ZUGFERD)}",
+            code=ErrorCode.INVALID_DATA,
+            stage="data_resolution",
+        )
+    template_path = Path(template)
+    if not template_path.exists():
+        raise TrustRenderError(
+            f"Template not found: {template_path}",
+            code=ErrorCode.TEMPLATE_NOT_FOUND,
+            stage="data_resolution",
+            template_path=str(template_path),
+        )
+    data_dict = _resolve_data(data)
+    resolved_fonts = _build_font_paths(font_paths)
+    # 1. Compute input fingerprint (before rendering)
+    fingerprint = compute_fingerprint(
+        template_path,
+        data_dict,
+        font_paths=resolved_fonts,
+        zugferd_profile=zugferd,
+        provenance_enabled=provenance,
+        validate_enabled=validate,
+    )
+    # 2. Run semantic validation (if hints provided)
+    semantic_report: SemanticReport | None = None
+    if semantic_hints is not None:
+        semantic_report = validate_semantics(data_dict, hints=semantic_hints)
+    # 3. Render (uses the existing pipeline)
+    t0 = time.monotonic()
+    result = _render_document_pipeline(
+        template_path,
+        data_dict,
+        debug=debug,
+        font_paths=resolved_fonts,
+        validate=validate,
+        zugferd=zugferd,
+        provenance=provenance,
+    )
+    render_duration_ms = int((time.monotonic() - t0) * 1000)
+    pdf_bytes = result.pdf_bytes
+    # 4. Write output if requested
+    if output is not None:
+        output_path = Path(output)
+        output_path.parent.mkdir(parents=True, exist_ok=True)
+        output_path.write_bytes(pdf_bytes)
+    # 5. Drift detection (if baseline_dir provided)
+    change_set = None
+    drift_result = None
+    if baseline_dir is not None:
+        from .regression import load_baseline
+        baseline = load_baseline(baseline_dir, template_path.name)
+        if baseline is not None:
+            # Compare fingerprints for change detection
+            baseline_fp = InputFingerprint.from_dict(baseline.fingerprint_json)
+            change_set = compare(baseline_fp, fingerprint, current_data=data_dict)
+            # Run drift checks
+            drift_result = check_drift(
+                baseline_dir,
+                template_path.name,
+                fingerprint,
+                pdf_bytes,
+                zugferd_valid=zugferd is not None,
+                contract_valid=validate,
+                semantic_issue_count=(
+                    len(semantic_report.issues) if semantic_report else 0
+                ),
+            )
+    # 6. Save baseline (if requested)
+    if save_baseline and baseline_dir is not None:
+        _save_baseline(
+            baseline_dir,
+            template_path.name,
+            fingerprint,
+            pdf_bytes,
+            render_duration_ms=render_duration_ms,
+            zugferd_valid=zugferd is not None if zugferd else None,
+            contract_valid=True if validate else None,
+            semantic_issue_count=(
+                len(semantic_report.issues) if semantic_report else 0
+            ),
+        )
+    return AuditResult(
+        pdf_bytes=pdf_bytes,
+        fingerprint=fingerprint,
+        change_set=change_set,
+        drift_result=drift_result,
+        semantic_report=semantic_report,
+    )
+def _resolve_data(data: dict | str | os.PathLike) -> dict:
+    """Resolve data argument to a dict."""
+    if isinstance(data, dict):
+        return data
+    if not isinstance(data, (str, os.PathLike)):
+        raise TrustRenderError(
+            f"Data must be a dict, JSON string, or path to a .json file, "
+            f"got {type(data).__name__}",
+            code=ErrorCode.INVALID_DATA,
+            stage="data_resolution",
+        )
+    # Try as file path first
+    path = Path(data) if not isinstance(data, str) else None
+    if path is None:
+        # Could be a JSON string or a file path string
+        candidate = Path(data)
+        if candidate.exists() and candidate.suffix == ".json":
+            path = candidate
+    if path is not None and path.exists():
+        with open(path) as f:
+            return json.load(f)
+    # Try as JSON string
+    if isinstance(data, str):
+        try:
+            result = json.loads(data)
+            if isinstance(result, dict):
+                return result
+            raise TrustRenderError(
+                f"Data JSON must be an object, got {type(result).__name__}",
+                code=ErrorCode.INVALID_DATA,
+                stage="data_resolution",
+            )
+        except json.JSONDecodeError as exc:
+            raise TrustRenderError(
+                f"Invalid data: not a valid file path or JSON string: {exc}",
+                code=ErrorCode.INVALID_DATA,
+                stage="data_resolution",
+            ) from exc
+    raise TrustRenderError(
+        f"Data must be a dict, JSON string, or path to a .json file, got {type(data).__name__}",
+        code=ErrorCode.INVALID_DATA,
+        stage="data_resolution",
+    )