PyPI - rdf-construct - Versions diffs - 0.2.0__py3-none-any.whl - Mend

rdf-construct 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88) hide show

rdf_construct/__init__.py +12 -0
rdf_construct/__main__.py +0 -0
rdf_construct/cli.py +1762 -0
rdf_construct/core/__init__.py +33 -0
rdf_construct/core/config.py +116 -0
rdf_construct/core/ordering.py +219 -0
rdf_construct/core/predicate_order.py +212 -0
rdf_construct/core/profile.py +157 -0
rdf_construct/core/selector.py +64 -0
rdf_construct/core/serialiser.py +232 -0
rdf_construct/core/utils.py +89 -0
rdf_construct/cq/__init__.py +77 -0
rdf_construct/cq/expectations.py +365 -0
rdf_construct/cq/formatters/__init__.py +45 -0
rdf_construct/cq/formatters/json.py +104 -0
rdf_construct/cq/formatters/junit.py +104 -0
rdf_construct/cq/formatters/text.py +146 -0
rdf_construct/cq/loader.py +300 -0
rdf_construct/cq/runner.py +321 -0
rdf_construct/diff/__init__.py +59 -0
rdf_construct/diff/change_types.py +214 -0
rdf_construct/diff/comparator.py +338 -0
rdf_construct/diff/filters.py +133 -0
rdf_construct/diff/formatters/__init__.py +71 -0
rdf_construct/diff/formatters/json.py +192 -0
rdf_construct/diff/formatters/markdown.py +210 -0
rdf_construct/diff/formatters/text.py +195 -0
rdf_construct/docs/__init__.py +60 -0
rdf_construct/docs/config.py +238 -0
rdf_construct/docs/extractors.py +603 -0
rdf_construct/docs/generator.py +360 -0
rdf_construct/docs/renderers/__init__.py +7 -0
rdf_construct/docs/renderers/html.py +803 -0
rdf_construct/docs/renderers/json.py +390 -0
rdf_construct/docs/renderers/markdown.py +628 -0
rdf_construct/docs/search.py +278 -0
rdf_construct/docs/templates/html/base.html.jinja +44 -0
rdf_construct/docs/templates/html/class.html.jinja +152 -0
rdf_construct/docs/templates/html/hierarchy.html.jinja +28 -0
rdf_construct/docs/templates/html/index.html.jinja +110 -0
rdf_construct/docs/templates/html/instance.html.jinja +90 -0
rdf_construct/docs/templates/html/namespaces.html.jinja +37 -0
rdf_construct/docs/templates/html/property.html.jinja +124 -0
rdf_construct/docs/templates/html/single_page.html.jinja +169 -0
rdf_construct/lint/__init__.py +75 -0
rdf_construct/lint/config.py +214 -0
rdf_construct/lint/engine.py +396 -0
rdf_construct/lint/formatters.py +327 -0
rdf_construct/lint/rules.py +692 -0
rdf_construct/main.py +6 -0
rdf_construct/puml2rdf/__init__.py +103 -0
rdf_construct/puml2rdf/config.py +230 -0
rdf_construct/puml2rdf/converter.py +420 -0
rdf_construct/puml2rdf/merger.py +200 -0
rdf_construct/puml2rdf/model.py +202 -0
rdf_construct/puml2rdf/parser.py +565 -0
rdf_construct/puml2rdf/validators.py +451 -0
rdf_construct/shacl/__init__.py +56 -0
rdf_construct/shacl/config.py +166 -0
rdf_construct/shacl/converters.py +520 -0
rdf_construct/shacl/generator.py +364 -0
rdf_construct/shacl/namespaces.py +93 -0
rdf_construct/stats/__init__.py +29 -0
rdf_construct/stats/collector.py +178 -0
rdf_construct/stats/comparator.py +298 -0
rdf_construct/stats/formatters/__init__.py +83 -0
rdf_construct/stats/formatters/json.py +38 -0
rdf_construct/stats/formatters/markdown.py +153 -0
rdf_construct/stats/formatters/text.py +186 -0
rdf_construct/stats/metrics/__init__.py +26 -0
rdf_construct/stats/metrics/basic.py +147 -0
rdf_construct/stats/metrics/complexity.py +137 -0
rdf_construct/stats/metrics/connectivity.py +130 -0
rdf_construct/stats/metrics/documentation.py +128 -0
rdf_construct/stats/metrics/hierarchy.py +207 -0
rdf_construct/stats/metrics/properties.py +88 -0
rdf_construct/uml/__init__.py +22 -0
rdf_construct/uml/context.py +194 -0
rdf_construct/uml/mapper.py +371 -0
rdf_construct/uml/odm_renderer.py +789 -0
rdf_construct/uml/renderer.py +684 -0
rdf_construct/uml/uml_layout.py +393 -0
rdf_construct/uml/uml_style.py +613 -0
rdf_construct-0.2.0.dist-info/METADATA +431 -0
rdf_construct-0.2.0.dist-info/RECORD +88 -0
rdf_construct-0.2.0.dist-info/WHEEL +4 -0
rdf_construct-0.2.0.dist-info/entry_points.txt +3 -0
rdf_construct-0.2.0.dist-info/licenses/LICENSE +21 -0

rdf_construct/lint/config.py ADDED Viewed

@@ -0,0 +1,214 @@
+"""Configuration file handling for rdf-construct lint.
+Supports loading .rdf-lint.yml files with rule settings and severity overrides.
+"""
+from __future__ import annotations
+from pathlib import Path
+from typing import Any
+import yaml
+from rdf_construct.lint.engine import LintConfig
+from rdf_construct.lint.rules import Severity, list_rules
+def load_lint_config(config_path: Path) -> LintConfig:
+    """Load lint configuration from a YAML file.
+    The configuration file format:
+    ```yaml
+    # Global settings
+    level: standard  # strict | standard | relaxed
+    # Rules to enable (empty means all)
+    enable:
+      - orphan-class
+      - missing-label
+    # Rules to disable
+    disable:
+      - inconsistent-naming
+    # Override severity for specific rules
+    severity:
+      missing-comment: info
+      orphan-class: warning
+    ```
+    Args:
+        config_path: Path to the YAML configuration file.
+    Returns:
+        LintConfig with settings from the file. An empty file yields the
+        default LintConfig.
+    Raises:
+        FileNotFoundError: If config file doesn't exist.
+        ValueError: If the file is not valid YAML, if its top level is not
+            a mapping, or if any setting is rejected by _parse_config.
+    """
+    if not config_path.exists():
+        raise FileNotFoundError(f"Config file not found: {config_path}")
+    with open(config_path, "r", encoding="utf-8") as f:
+        try:
+            data = yaml.safe_load(f)
+        except yaml.YAMLError as e:
+            # Keep the parser error attached as __cause__ for debugging.
+            raise ValueError(f"Invalid YAML in config file: {e}") from e
+    # safe_load returns None for an empty (or comment-only) document.
+    if data is None:
+        data = {}
+    # A top-level list or scalar is valid YAML but not a valid config; reject
+    # it here rather than letting the key lookups below misbehave.
+    if not isinstance(data, dict):
+        raise ValueError(
+            f"Config file {config_path} must contain a mapping at the top level, "
+            f"got {type(data).__name__}."
+        )
+    return _parse_config(data, config_path)
+def _parse_config(data: dict[str, Any], source: Path) -> LintConfig:
+    """Parse configuration dictionary into LintConfig.
+    Recognised keys are 'level', 'enable', 'disable' and 'severity'; any
+    other key is ignored.
+    Args:
+        data: Configuration dictionary from YAML.
+        source: Source file path (for error messages).
+    Returns:
+        Parsed LintConfig.
+    Raises:
+        ValueError: If the level is not one of the three known values, if
+            'enable'/'disable' is not a list, if 'severity' is not a mapping,
+            if a rule id is not registered, or if a severity name is invalid.
+    """
+    config = LintConfig()
+    known_rules = set(list_rules())
+    # Parse level
+    if "level" in data:
+        level = data["level"]
+        if level not in ("strict", "standard", "relaxed"):
+            raise ValueError(
+                f"Invalid level '{level}' in {source}. "
+                "Must be 'strict', 'standard', or 'relaxed'."
+            )
+        config.level = level
+    # Parse enabled and disabled rules: both sections have the same shape and
+    # differ only in which set on the config they populate.
+    for section, target in (
+        ("enable", config.enabled_rules),
+        ("disable", config.disabled_rules),
+    ):
+        if section not in data:
+            continue
+        rule_ids = data[section]
+        if not isinstance(rule_ids, list):
+            raise ValueError(f"'{section}' must be a list in {source}")
+        for rule_id in rule_ids:
+            _require_known_rule(rule_id, section, known_rules, source)
+            target.add(rule_id)
+    # Parse severity overrides
+    if "severity" in data:
+        severities = data["severity"]
+        if not isinstance(severities, dict):
+            raise ValueError(f"'severity' must be a mapping in {source}")
+        for rule_id, sev_str in severities.items():
+            _require_known_rule(rule_id, "severity", known_rules, source)
+            try:
+                severity = Severity(sev_str)
+            except ValueError:
+                # The enum's own message adds nothing; suppress the context.
+                raise ValueError(
+                    f"Invalid severity '{sev_str}' for rule '{rule_id}' in {source}. "
+                    "Must be 'error', 'warning', or 'info'."
+                ) from None
+            config.severity_overrides[rule_id] = severity
+    return config
+def _require_known_rule(
+    rule_id: Any, section: str, known_rules: set[str], source: Path
+) -> None:
+    """Raise ValueError unless rule_id names a registered lint rule.
+    Args:
+        rule_id: Value read from the config file.
+        section: Config section being parsed (used in the error message).
+        known_rules: Identifiers of all registered rules.
+        source: Source file path (for error messages).
+    """
+    # The isinstance guard stops unhashable YAML values (nested lists or
+    # mappings) from raising TypeError in the set membership test.
+    if not isinstance(rule_id, str) or rule_id not in known_rules:
+        raise ValueError(
+            f"Unknown rule '{rule_id}' in '{section}' section of {source}. "
+            f"Available rules: {', '.join(sorted(known_rules))}"
+        )
+def find_config_file(start_dir: Path | None = None) -> Path | None:
+    """Find a lint config file by searching up the directory tree.
+    Looks for files named '.rdf-lint.yml', '.rdf-lint.yaml', 'rdf-lint.yml'
+    or 'rdf-lint.yaml' (checked in that order within each directory),
+    starting from start_dir and moving up to the filesystem root. The
+    nearest directory containing a match wins.
+    Args:
+        start_dir: Directory to start searching from. Defaults to cwd.
+    Returns:
+        Path to config file if found, None otherwise.
+    """
+    if start_dir is None:
+        start_dir = Path.cwd()
+    config_names = [".rdf-lint.yml", ".rdf-lint.yaml", "rdf-lint.yml", "rdf-lint.yaml"]
+    search_root = start_dir.resolve()
+    # Path.parents walks every ancestor up to and including the root.
+    for directory in (search_root, *search_root.parents):
+        for name in config_names:
+            candidate = directory / name
+            # is_file() rather than exists(): a directory that happens to
+            # carry a config name cannot be loaded as a config.
+            if candidate.is_file():
+                return candidate
+    return None
+def create_default_config() -> str:
+    """Generate a default configuration file as a string.
+    The trailing "Available rules" section lists every registered rule id,
+    sorted, one per comment line.
+    Returns:
+        YAML string with commented default configuration.
+    """
+    known_rules = sorted(list_rules())
+    # Each entry carries its own '#' prefix, so the template must not add
+    # another one (that produced "# #   - <first rule>").
+    rule_lines = "\n".join(f"#   - {r}" for r in known_rules)
+    return f"""\
+# rdf-construct lint configuration
+# Place this file as .rdf-lint.yml in your project root
+# Strictness level: strict | standard | relaxed
+# - strict: warnings become errors
+# - standard: default severities
+# - relaxed: warnings become info
+level: standard
+# Enable only specific rules (empty = all rules)
+# enable:
+#   - orphan-class
+#   - missing-label
+# Disable specific rules
+# disable:
+#   - inconsistent-naming
+# Override severity for specific rules
+# severity:
+#   missing-comment: info
+#   orphan-class: warning
+# Available rules:
+{rule_lines}
+"""

rdf_construct/lint/engine.py ADDED Viewed

@@ -0,0 +1,396 @@
+"""Lint engine for running rules against RDF graphs.
+The engine coordinates rule execution, applies configuration overrides,
+and collects results for reporting.
+"""
+from __future__ import annotations
+import re
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Sequence
+from rdflib import Graph, URIRef
+from rdf_construct.lint.rules import (
+    get_all_rules,
+    get_rule,
+    LintIssue,
+    RuleSpec,
+    Severity,
+)
+def find_line_number(file_path: Path, entity: URIRef) -> int | None:
+    """Find approximate line number for an entity's definition in a Turtle file.
+    Prioritises finding the entity as a subject (its definition) rather than
+    as a predicate or object. The search is textual (regex per line), not a
+    real Turtle parse, so the result is a best-effort hint.
+    Args:
+        file_path: Source file to scan.
+        entity: URI of the entity to locate.
+    Returns:
+        1-based line number of the first match, or None if the file cannot
+        be read as UTF-8 text or no line mentions the entity.
+    """
+    uri_str = str(entity)
+    # Extract local name
+    if "#" in uri_str:
+        local_name = uri_str.split("#")[-1]
+    elif "/" in uri_str:
+        local_name = uri_str.rsplit("/", 1)[-1]
+    else:
+        local_name = uri_str
+    try:
+        with open(file_path, "r", encoding="utf-8") as f:
+            lines = f.readlines()
+    except (OSError, UnicodeDecodeError):
+        # Covers a missing file as well as unreadable / non-UTF-8 content.
+        return None
+    # First pass candidates: entity as a SUBJECT at the start of a line.
+    subject_patterns = [rf"^\s*<{re.escape(uri_str)}>\s+"]
+    # Second pass candidates: any occurrence (fallback).
+    fallback_patterns = [re.escape(f"<{uri_str}>")]
+    # Prefixed-name forms only make sense with a non-empty local name; with
+    # an empty one (URI ending in '#' or '/') they would match unrelated text.
+    if local_name:
+        # '[\w.-]*' also accepts the empty default prefix, e.g. ':Person'.
+        prefixed = rf"[\w.-]*:{re.escape(local_name)}"
+        subject_patterns.append(rf"^\s*{prefixed}\s+")
+        fallback_patterns.append(rf"(?<![\w.-]){prefixed}\b")
+    for pattern in subject_patterns:
+        regex = re.compile(pattern)
+        for i, line in enumerate(lines, start=1):
+            if regex.match(line):
+                return i
+    for pattern in fallback_patterns:
+        regex = re.compile(pattern)
+        for i, line in enumerate(lines, start=1):
+            if regex.search(line):
+                return i
+    return None
+@dataclass
+class LintConfig:
+    """Configuration for a lint run.
+    Attributes:
+        level: Strictness level (strict/standard/relaxed).
+        enabled_rules: Specific rules to enable (empty = all).
+        disabled_rules: Specific rules to disable.
+        severity_overrides: Override default severity for specific rules.
+    """
+    level: str = "standard"
+    enabled_rules: set[str] = field(default_factory=set)
+    disabled_rules: set[str] = field(default_factory=set)
+    severity_overrides: dict[str, Severity] = field(default_factory=dict)
+    def get_effective_rules(self) -> list[RuleSpec]:
+        """Get the list of rules that should run based on config.
+        Rules are returned in the order the rule registry yields them, so
+        repeated runs execute rules (and report issues) in the same order.
+        Returns:
+            List of RuleSpec objects to execute.
+        """
+        all_rules = get_all_rules()
+        # If specific rules enabled, use only those. Walk the registry rather
+        # than the enabled set: set iteration order is not stable across runs.
+        if self.enabled_rules:
+            rules = [
+                rule
+                for rule_id, rule in all_rules.items()
+                if rule_id in self.enabled_rules
+            ]
+        else:
+            rules = list(all_rules.values())
+        # Remove disabled rules
+        rules = [r for r in rules if r.rule_id not in self.disabled_rules]
+        # Apply level filtering
+        if self.level == "relaxed":
+            # Relaxed: skip rules whose *default* severity is INFO
+            # (severity_overrides are not consulted here).
+            rules = [r for r in rules if r.default_severity != Severity.INFO]
+        # Strict needs no filtering; its warning->error bump is applied in
+        # get_effective_severity.
+        return rules
+    def get_effective_severity(self, rule_id: str) -> Severity:
+        """Get the effective severity for a rule.
+        An explicit entry in severity_overrides always wins. Otherwise the
+        rule's default severity is used, with WARNING promoted to ERROR in
+        strict mode and demoted to INFO in relaxed mode.
+        Args:
+            rule_id: The rule identifier.
+        Returns:
+            The severity to use for this rule. Identifiers that are not
+            registered rules resolve to ERROR.
+        """
+        # Check for explicit override
+        if rule_id in self.severity_overrides:
+            return self.severity_overrides[rule_id]
+        rule = get_rule(rule_id)
+        if rule is None:
+            return Severity.ERROR
+        # Level adjustments only ever touch WARNING-level rules.
+        if rule.default_severity == Severity.WARNING:
+            if self.level == "strict":
+                return Severity.ERROR
+            if self.level == "relaxed":
+                return Severity.INFO
+        return rule.default_severity
+@dataclass
+class LintResult:
+    """Outcome of linting one file (or one in-memory graph).
+    Attributes:
+        file_path: Path to the linted file.
+        graph: The parsed RDF graph (for namespace resolution).
+        issues: List of issues found.
+        error_count: Number of error-level issues.
+        warning_count: Number of warning-level issues.
+        info_count: Number of issues that are neither error nor warning.
+    """
+    file_path: Path
+    graph: Graph | None = None
+    issues: list[LintIssue] = field(default_factory=list)
+    error_count: int = 0
+    warning_count: int = 0
+    info_count: int = 0
+    def add_issue(self, issue: LintIssue) -> None:
+        """Record an issue and bump the counter matching its severity."""
+        self.issues.append(issue)
+        level = issue.severity
+        if level == Severity.ERROR:
+            self.error_count += 1
+            return
+        if level == Severity.WARNING:
+            self.warning_count += 1
+            return
+        # Anything that is not an error or a warning is tallied as info.
+        self.info_count += 1
+    @property
+    def total_issues(self) -> int:
+        """Number of issues recorded, regardless of severity."""
+        recorded = self.issues
+        return len(recorded)
+    @property
+    def has_errors(self) -> bool:
+        """True when at least one error-level issue was counted."""
+        return 0 < self.error_count
+    @property
+    def has_warnings(self) -> bool:
+        """True when at least one warning-level issue was counted."""
+        return 0 < self.warning_count
+@dataclass
+class LintSummary:
+    """Aggregate view over the results of several linted files.
+    Attributes:
+        results: Individual file results.
+        total_errors: Total errors across all files.
+        total_warnings: Total warnings across all files.
+        total_info: Total info messages across all files.
+    """
+    results: list[LintResult] = field(default_factory=list)
+    total_errors: int = 0
+    total_warnings: int = 0
+    total_info: int = 0
+    def add_result(self, result: LintResult) -> None:
+        """Append a file result and fold its counters into the totals."""
+        self.results.append(result)
+        self.total_errors = self.total_errors + result.error_count
+        self.total_warnings = self.total_warnings + result.warning_count
+        self.total_info = self.total_info + result.info_count
+    @property
+    def exit_code(self) -> int:
+        """Process exit code derived from the totals.
+        Returns:
+            2 if any errors were counted, otherwise 1 if any warnings were
+            counted, otherwise 0 (info-only runs also yield 0).
+        """
+        if self.total_errors > 0:
+            return 2
+        return 1 if self.total_warnings > 0 else 0
+    @property
+    def files_with_issues(self) -> int:
+        """Count of results that report one or more issues."""
+        flagged = [entry for entry in self.results if entry.total_issues > 0]
+        return len(flagged)
+class LintEngine:
+    """Engine for running lint rules against RDF graphs.
+    The engine loads graphs, runs configured rules, and collects results.
+    It supports linting single files or batches of files.
+    """
+    # File suffix (lower-cased) -> rdflib parser format name. Unlisted
+    # suffixes fall back to Turtle.
+    _FORMAT_BY_SUFFIX = {
+        ".ttl": "turtle",
+        ".turtle": "turtle",
+        ".rdf": "xml",
+        ".xml": "xml",
+        ".owl": "xml",
+        ".nt": "nt",
+        ".ntriples": "nt",
+        ".n3": "n3",
+        ".jsonld": "json-ld",
+        ".json": "json-ld",
+    }
+    def __init__(self, config: LintConfig | None = None):
+        """Initialise the lint engine.
+        Args:
+            config: Configuration for the lint run. Defaults to standard config.
+        """
+        self.config = config or LintConfig()
+    def _populate_line_numbers(self, result: LintResult, file_path: Path) -> None:
+        """Add line numbers to issues by searching the source file."""
+        for issue in result.issues:
+            # Only issues tied to an entity and still lacking a line are
+            # looked up; existing line numbers are left untouched.
+            if issue.entity and issue.line is None:
+                issue.line = find_line_number(file_path, issue.entity)
+    def _run_rules(self, graph: Graph, result: LintResult) -> None:
+        """Run every effective rule against graph, recording issues in result.
+        Each reported issue is re-created with the configured effective
+        severity. A rule that raises does not abort the run; the failure is
+        recorded as an ERROR issue with id 'rule-error:<rule_id>'.
+        """
+        for rule in self.config.get_effective_rules():
+            try:
+                issues = rule.check_fn(graph)
+                for issue in issues:
+                    # Apply severity override
+                    effective_severity = self.config.get_effective_severity(issue.rule_id)
+                    adjusted_issue = LintIssue(
+                        rule_id=issue.rule_id,
+                        severity=effective_severity,
+                        entity=issue.entity,
+                        message=issue.message,
+                        line=issue.line,
+                    )
+                    result.add_issue(adjusted_issue)
+            except Exception as e:
+                # Rule execution error
+                result.add_issue(
+                    LintIssue(
+                        rule_id=f"rule-error:{rule.rule_id}",
+                        severity=Severity.ERROR,
+                        entity=None,
+                        message=f"Rule '{rule.rule_id}' failed: {e}",
+                    )
+                )
+    def lint_file(self, file_path: Path) -> LintResult:
+        """Lint a single RDF file.
+        The parser format is guessed from the file suffix (Turtle when the
+        suffix is not recognised).
+        Args:
+            file_path: Path to the RDF file.
+        Returns:
+            LintResult containing all issues found. Loading or parsing
+            failures (including a missing file) are not raised: they are
+            returned as a single ERROR issue with rule id 'parse-error',
+            and no rules are run.
+        """
+        result = LintResult(file_path=file_path)
+        # Load the graph
+        graph = Graph()
+        try:
+            # Guess format from extension
+            fmt = self._FORMAT_BY_SUFFIX.get(file_path.suffix.lower(), "turtle")
+            graph.parse(file_path.as_posix(), format=fmt)
+            result.graph = graph  # Store for namespace resolution
+        except Exception as e:
+            # Return result with parse error
+            result.add_issue(
+                LintIssue(
+                    rule_id="parse-error",
+                    severity=Severity.ERROR,
+                    entity=None,
+                    message=f"Failed to parse file: {e}",
+                )
+            )
+            return result
+        self._run_rules(graph, result)
+        # Populate line numbers
+        self._populate_line_numbers(result, file_path)
+        return result
+    def lint_files(self, file_paths: Sequence[Path]) -> LintSummary:
+        """Lint multiple RDF files.
+        Args:
+            file_paths: Paths to RDF files.
+        Returns:
+            LintSummary containing all results, in input order.
+        """
+        summary = LintSummary()
+        for path in file_paths:
+            summary.add_result(self.lint_file(path))
+        return summary
+    def lint_graph(self, graph: Graph, source_name: str = "<graph>") -> LintResult:
+        """Lint an in-memory RDF graph.
+        No line numbers are looked up, since there is no source file.
+        Args:
+            graph: The RDF graph to lint.
+            source_name: Name to use in result (for display).
+        Returns:
+            LintResult containing all issues found.
+        """
+        result = LintResult(file_path=Path(source_name), graph=graph)
+        self._run_rules(graph, result)
+        return result