PyPI - bookwright-cli - Versions diffs - 0.2.0__py3-none-any.whl - Mend

bookwright-cli 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (149) hide show

bookwright/__init__.py +3 -0
bookwright/__main__.py +6 -0
bookwright/cli.py +19 -0
bookwright/commands/__init__.py +0 -0
bookwright/commands/_envelope.py +36 -0
bookwright/commands/check.py +75 -0
bookwright/commands/graph/__init__.py +23 -0
bookwright/commands/graph/build.py +157 -0
bookwright/commands/graph/envelope.py +26 -0
bookwright/commands/graph/query.py +98 -0
bookwright/commands/init/__init__.py +5 -0
bookwright/commands/init/conflict.py +107 -0
bookwright/commands/init/envelope.py +322 -0
bookwright/commands/init/git.py +96 -0
bookwright/commands/init/main.py +263 -0
bookwright/commands/init/resolve.py +193 -0
bookwright/commands/init/scaffold.py +242 -0
bookwright/commands/init/validate.py +172 -0
bookwright/commands/integration/__init__.py +22 -0
bookwright/commands/integration/use.py +120 -0
bookwright/commands/validate.py +160 -0
bookwright/commands/version.py +35 -0
bookwright/core/__init__.py +35 -0
bookwright/core/_blocks.py +239 -0
bookwright/core/_build.py +154 -0
bookwright/core/_research_block.py +56 -0
bookwright/core/_translate.py +90 -0
bookwright/core/errors.py +127 -0
bookwright/core/iso639_1.py +200 -0
bookwright/core/manifest.py +343 -0
bookwright/errors.py +47 -0
bookwright/golem/__init__.py +71 -0
bookwright/golem/base.py +200 -0
bookwright/golem/errors.py +29 -0
bookwright/golem/modules/__init__.py +1 -0
bookwright/golem/modules/character.py +109 -0
bookwright/golem/modules/event.py +91 -0
bookwright/golem/modules/feature.py +161 -0
bookwright/golem/modules/inference.py +41 -0
bookwright/golem/modules/narrative.py +55 -0
bookwright/golem/modules/provenance.py +197 -0
bookwright/golem/modules/relationship.py +38 -0
bookwright/golem/modules/setting.py +30 -0
bookwright/golem/namespaces.py +332 -0
bookwright/golem/serialize.py +25 -0
bookwright/golem/slug.py +22 -0
bookwright/indexers/__init__.py +47 -0
bookwright/indexers/base.py +55 -0
bookwright/indexers/errors.py +80 -0
bookwright/indexers/rdflib_indexer.py +89 -0
bookwright/integrations/__init__.py +155 -0
bookwright/integrations/base.py +117 -0
bookwright/integrations/claude/__init__.py +29 -0
bookwright/integrations/constants.py +38 -0
bookwright/integrations/descriptions.py +48 -0
bookwright/integrations/errors.py +170 -0
bookwright/integrations/generic/__init__.py +56 -0
bookwright/integrations/lint.py +160 -0
bookwright/integrations/materialize.py +202 -0
bookwright/integrations/options.py +203 -0
bookwright/io/__init__.py +1 -0
bookwright/io/bible.py +500 -0
bookwright/io/errors.py +98 -0
bookwright/io/frontmatter.py +61 -0
bookwright/io/fs.py +226 -0
bookwright/io/manuscript.py +15 -0
bookwright/io/project.py +21 -0
bookwright/io/report.py +107 -0
bookwright/io/research.py +427 -0
bookwright/resources/__init__.py +1 -0
bookwright/resources/commands/bookwright-analyze.md +66 -0
bookwright/resources/commands/bookwright-bible.md +96 -0
bookwright/resources/commands/bookwright-checklist.md +67 -0
bookwright/resources/commands/bookwright-clarify.md +65 -0
bookwright/resources/commands/bookwright-constitution.md +79 -0
bookwright/resources/commands/bookwright-continuity.md +70 -0
bookwright/resources/commands/bookwright-draft.md +74 -0
bookwright/resources/commands/bookwright-outline.md +71 -0
bookwright/resources/commands/bookwright-research.md +107 -0
bookwright/resources/commands/bookwright-scenes.md +66 -0
bookwright/resources/commands/bookwright-synopsis.md +67 -0
bookwright/resources/commands/bookwright-verify.md +136 -0
bookwright/resources/commands/references/golem-character.md +65 -0
bookwright/resources/commands/references/golem-events-timeline.md +56 -0
bookwright/resources/commands/references/golem-relationships.md +53 -0
bookwright/resources/commands/references/greimas-actants.md +57 -0
bookwright/resources/commands/references/pending-protocol.md +72 -0
bookwright/resources/commands/references/propp-functions.md +54 -0
bookwright/resources/commands/references/research-format.md +136 -0
bookwright/resources/project/.bookwright/cache/.gitkeep +0 -0
bookwright/resources/project/.bookwright/schema/.gitkeep +0 -0
bookwright/resources/project/.bookwright/templates/.gitkeep +0 -0
bookwright/resources/project/.gitignore +23 -0
bookwright/resources/project/README.md.j2 +40 -0
bookwright/resources/project/__init__.py +6 -0
bookwright/resources/project/bible/characters/.gitkeep +0 -0
bookwright/resources/project/bible/constitution.md.j2 +74 -0
bookwright/resources/project/bible/glossary.md +36 -0
bookwright/resources/project/bible/locations/.gitkeep +0 -0
bookwright/resources/project/bible/pov-structure.md +43 -0
bookwright/resources/project/bible/relationships.md +36 -0
bookwright/resources/project/bible/research/_index.md +28 -0
bookwright/resources/project/bible/research/sources.md +23 -0
bookwright/resources/project/bible/settings/.gitkeep +0 -0
bookwright/resources/project/bible/subplots.md +35 -0
bookwright/resources/project/bible/themes.md +36 -0
bookwright/resources/project/bible/timeline.md +38 -0
bookwright/resources/project/manuscript/.gitkeep +0 -0
bookwright/resources/project/outline/arcs.md +34 -0
bookwright/resources/project/outline/scenes.md +31 -0
bookwright/resources/project/outline/structure.md +35 -0
bookwright/resources/project/outline/synopsis.md +25 -0
bookwright/resources/schemas/__init__.py +19 -0
bookwright/resources/schemas/golem-1.1/VERSION +1 -0
bookwright/resources/schemas/golem-1.1/golem.ttl +1947 -0
bookwright/resources/schemas/golem-1.1/version.json +8 -0
bookwright/resources/templates/__init__.py +1 -0
bookwright/resources/templates/bible/character.md.tmpl +63 -0
bookwright/resources/templates/bible/location.md.tmpl +37 -0
bookwright/resources/templates/bible/research/_index.md.tmpl +25 -0
bookwright/resources/templates/bible/research/sources.md.tmpl +21 -0
bookwright/resources/templates/bible/research/tema.md.tmpl +37 -0
bookwright/resources/templates/bible/setting.md.tmpl +38 -0
bookwright/resources/templates/manifest.template.toml +79 -0
bookwright/resources/templates/manuscript/chapter.md.tmpl +36 -0
bookwright/resources/templates/scenes/scene.md.tmpl +37 -0
bookwright/resources/vocabularies/__init__.py +6 -0
bookwright/resources/vocabularies/greimas.ttl +4 -0
bookwright/resources/vocabularies/propp.ttl +4 -0
bookwright/resources/vocabularies/sources.ttl +82 -0
bookwright/validation/__init__.py +33 -0
bookwright/validation/anchor_queries.py +223 -0
bookwright/validation/base.py +233 -0
bookwright/validation/queries.py +197 -0
bookwright/validation/registry.py +185 -0
bookwright/validation/report.py +106 -0
bookwright/validation/runner.py +65 -0
bookwright/validation/validators/__init__.py +9 -0
bookwright/validation/validators/character_presence.py +202 -0
bookwright/validation/validators/factual_anchor.py +291 -0
bookwright/validation/validators/focalization.py +152 -0
bookwright/validation/validators/setting_continuity.py +100 -0
bookwright/validation/validators/temporal.py +277 -0
bookwright_cli-0.2.0.dist-info/METADATA +218 -0
bookwright_cli-0.2.0.dist-info/RECORD +149 -0
bookwright_cli-0.2.0.dist-info/WHEEL +4 -0
bookwright_cli-0.2.0.dist-info/entry_points.txt +2 -0
bookwright_cli-0.2.0.dist-info/licenses/LICENSE +202 -0
bookwright_cli-0.2.0.dist-info/licenses/NOTICE +14 -0

bookwright/validation/validators/factual_anchor.py ADDED Viewed

@@ -0,0 +1,291 @@
+"""``factual_anchor`` — structural + chronological audit of research anchors (§ 20.6).
+The fifth built-in validator. A pure graph consumer (FR-003): it reads the anchor
+sub-graph through :mod:`bookwright.validation.anchor_queries` and the manifest
+through the :class:`ValidationContext`, and emits
+* **warnings** for structural defects — an unsourced anchor (R1/FR-006), a source
+  missing a mandatory provenance facet (R2/FR-007), under-reliable support
+  (R3/FR-008), and a missing promoted finding or constrained entity (R4/FR-009);
+* an **error** for a hard anachronism between an anchor's time-span and the
+  interval of the event (or timeline) it constrains (R5/FR-010), decided by the
+  shared :func:`~bookwright.validation.queries.intervals_disjoint` predicate so the
+  contradiction logic is never forked from ``temporal`` (FR-011).
+It is inert — returns ``[]`` immediately — when ``[research].enabled`` is false
+(FR-015) or the graph carries no anchor (FR-016), so it costs nothing on a
+non-research project. No rdflib here: all SPARQL lives in the projection modules.
+"""
+from __future__ import annotations
+from dataclasses import dataclass
+from typing import ClassVar
+from bookwright.golem.namespaces import (
+    BW_CONSTRAINS,
+    BW_PROMOTES,
+    BW_SUPPORTED_BY,
+    RELIABILITY_IRI,
+    timeline_uri,
+)
+from bookwright.indexers import Indexer
+from bookwright.validation.anchor_queries import (
+    FACETS,
+    AnchorRecord,
+    SourceRecord,
+    entity_present,
+    load_anchors,
+    load_sources_by_anchor,
+)
+from bookwright.validation.base import Severity, ValidationContext, Violation
+from bookwright.validation.queries import (
+    EventInterval,
+    intervals_disjoint,
+    load_intervals,
+    resolve_source,
+    timeline_bounds,
+)
+# The reliability scale, lowest → highest. The rating NAMES are the single
+# vocabulary source (``RELIABILITY_IRI`` keys); only the domain ordering
+# (``baja < media < alta``) lives here. The membership guard below trips if the
+# vocabulary ever gains or renames a rating, so the scale can never silently drift.
+_RELIABILITY_ORDER: tuple[str, ...] = ("baja", "media", "alta")
+_RELIABILITY_RANK: dict[str, int] = {name: rank for rank, name in enumerate(_RELIABILITY_ORDER)}
+assert set(_RELIABILITY_RANK) == set(RELIABILITY_IRI), (
+    "reliability scale drifted from RELIABILITY_IRI"
+)
+def _label(uri: str) -> str:
+    """A short, readable name from a URI (its final path segment)."""
+    return uri.rstrip("/").rsplit("/", 1)[-1]
+def _range(interval: EventInterval) -> str:
+    """A human ``begin-end`` year range, an open bound shown as ``?``."""
+    begin = interval.begin if interval.begin is not None else "?"
+    end = interval.end if interval.end is not None else "?"
+    return f"{begin}-{end}"
+@dataclass(frozen=True)
+class _IntervalView:
+    """Immutable bundle of the interval data the anachronism rule compares against.
+    ``FactualAnchor.validate`` builds exactly one instance per run and hands it to
+    every per-anchor audit, so the interval data is loaded once rather than per anchor.
+    ``events`` maps every ``G5_Narrative_Event`` URI to its interval; ``timeline``
+    is the overall bounds for a timeline-targeting anchor (``None`` when no anchor
+    carries a span, so the data was never loaded).
+    """
+    events: dict[str, EventInterval]  # event URI -> interval; empty when nothing was loaded
+    timeline: EventInterval | None  # overall timeline bounds, or None when not loaded
+class FactualAnchor:
+    """Audits each research anchor's structural integrity and chronology."""
+    name: ClassVar[str] = "factual_anchor"
+    severity_default: ClassVar[Severity] = Severity.warning
+    def validate(self, project: ValidationContext, indexer: Indexer) -> list[Violation]:
+        if project.manifest.research.enabled is False:
+            return []  # FR-015: the research system is turned off
+        anchors = load_anchors(indexer)
+        if not anchors:
+            return []  # FR-016: nothing to audit on a non-research project
+        sources_by_anchor = load_sources_by_anchor(indexer)
+        # Interval data is only loaded when at least one anchor carries a time-span —
+        # a non-temporal research project pays nothing for the anachronism rule.
+        spanned = any(a.span.begin is not None or a.span.end is not None for a in anchors)
+        events = load_intervals(indexer) if spanned else {}
+        intervals = _IntervalView(
+            events=events,
+            timeline=timeline_bounds(events) if spanned else None,
+        )
+        out: list[Violation] = []
+        for anchor in anchors:  # already sorted by URI (deterministic, FR-003)
+            sources = sources_by_anchor.get(anchor.uri, [])
+            out.extend(self._audit(anchor, sources, intervals, project, indexer))
+        return out
+    def _audit(
+        self,
+        anchor: AnchorRecord,
+        sources: list[SourceRecord],
+        intervals: _IntervalView,
+        project: ValidationContext,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        """Run every rule against one anchor, collecting its violations in order."""
+        finding_present = entity_present(indexer, anchor.promotes, project.uri_base)
+        out: list[Violation] = []
+        out.extend(self._unsourced(anchor, sources, finding_present, indexer))
+        out.extend(self._incomplete(anchor, sources, project, indexer))
+        out.extend(self._under_reliable(anchor, sources, project, indexer))
+        out.extend(self._missing_entity(anchor, finding_present, project, indexer))
+        out.extend(self._anachronism(anchor, intervals, project, indexer))
+        return out
+    def _violation(
+        self, anchor: AnchorRecord, indexer: Indexer, message: str, triple: tuple[str, str, str]
+    ) -> Violation:
+        """A ``warning`` carrying the anchor's locator (``None`` today) + one edge."""
+        return Violation(
+            validator=self.name,
+            severity=Severity.warning,
+            message=message,
+            source=resolve_source(indexer, anchor.uri),
+            triples=(triple,),
+        )
+    # --- R1 unsourced (FR-006) ----------------------------------------------
+    def _unsourced(
+        self,
+        anchor: AnchorRecord,
+        sources: list[SourceRecord],
+        finding_present: bool,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        # Suppressed when the finding is absent — R4 reports that once (no double-label).
+        if not finding_present or sources:
+            return []
+        message = f"anchor '{_label(anchor.uri)}' promotes a finding with no supporting source"
+        triple = (anchor.uri, str(BW_PROMOTES), anchor.promotes)
+        return [self._violation(anchor, indexer, message, triple)]
+    # --- R2 provenance-incomplete (FR-007) ----------------------------------
+    def _incomplete(
+        self,
+        anchor: AnchorRecord,
+        sources: list[SourceRecord],
+        project: ValidationContext,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        book_language = project.manifest.book.language
+        out: list[Violation] = []
+        for source in sources:
+            # The implicated edge is the real finding→source link that locates the
+            # source; a missing facet has no object, so it is never a fabricated triple.
+            located = (anchor.promotes, str(BW_SUPPORTED_BY), source.uri)
+            for facet in FACETS:
+                if str(facet.predicate) in source.present_predicates:
+                    continue
+                # ``translation`` is mandatory only for a foreign-language source; if
+                # the language itself is unknown it is already flagged, so skip here.
+                if facet.foreign_only and (
+                    source.original_language is None or source.original_language == book_language
+                ):
+                    continue
+                message = (
+                    f"source '{_label(source.uri)}' backing anchor '{_label(anchor.uri)}' "
+                    f"is missing its {facet.label}"
+                )
+                out.append(self._violation(anchor, indexer, message, located))
+        return out
+    # --- R3 under-reliable (FR-008) -----------------------------------------
+    def _under_reliable(
+        self,
+        anchor: AnchorRecord,
+        sources: list[SourceRecord],
+        project: ValidationContext,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        if not sources:  # an unsourced anchor is R1's concern, not R3's (no double-label)
+            return []
+        minimum = project.manifest.research.min_reliability_for_anchor
+        rated = [_RELIABILITY_RANK[s.reliability] for s in sources if s.reliability is not None]
+        # No rated source at all → below every threshold; else compare the best.
+        if rated and max(rated) >= _RELIABILITY_RANK[minimum]:
+            return []
+        if rated:  # a rating is present, it is just too low
+            message = (
+                f"anchor '{_label(anchor.uri)}' is backed only by sources below the "
+                f"minimum reliability '{minimum}'"
+            )
+        else:  # sources exist but none carries a rating at all — not "below", unrated
+            message = (
+                f"anchor '{_label(anchor.uri)}' is backed by sources but none carries a "
+                f"reliability rating (minimum required: '{minimum}')"
+            )
+        triple = (anchor.uri, str(BW_PROMOTES), anchor.promotes)
+        return [self._violation(anchor, indexer, message, triple)]
+    # --- R4 missing entity (FR-009) -----------------------------------------
+    def _missing_entity(
+        self,
+        anchor: AnchorRecord,
+        finding_present: bool,
+        project: ValidationContext,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        out: list[Violation] = []
+        if not finding_present:
+            message = f"anchor '{_label(anchor.uri)}' promotes a finding not present in the graph"
+            triple = (anchor.uri, str(BW_PROMOTES), anchor.promotes)
+            out.append(self._violation(anchor, indexer, message, triple))
+        target = anchor.constrains
+        target_present = target is not None and entity_present(indexer, target, project.uri_base)
+        if not target_present:
+            message = (
+                f"anchor '{_label(anchor.uri)}' constrains a narrative entity "
+                "that is not present in the graph"
+            )
+            # The dropped-link case has no constrains triple → cite the promotes edge.
+            triple = (
+                (anchor.uri, str(BW_CONSTRAINS), target)
+                if target is not None
+                else (anchor.uri, str(BW_PROMOTES), anchor.promotes)
+            )
+            out.append(self._violation(anchor, indexer, message, triple))
+        return out
+    # --- R5 anachronism (FR-010/FR-012) -------------------------------------
+    def _anachronism(
+        self,
+        anchor: AnchorRecord,
+        intervals: _IntervalView,
+        project: ValidationContext,
+        indexer: Indexer,
+    ) -> list[Violation]:
+        span = anchor.span
+        if span.begin is None and span.end is None:
+            return []  # no time-span → nothing to compare against
+        target = anchor.constrains
+        if target is None:
+            return []  # dropped link — already R4's concern, no interval to compare
+        target_interval = self._target_interval(target, intervals, project.uri_base)
+        if target_interval is None:
+            return []  # non-temporal / non-event target → no comparable interval (FR-012)
+        if not intervals_disjoint(span, target_interval):
+            return []
+        message = (
+            f"anchor '{_label(anchor.uri)}' ({_range(span)}) constrains "
+            f"'{_label(target)}' ({_range(target_interval)}), but their year ranges "
+            "are disjoint (anachronism)"
+        )
+        return [
+            Violation(
+                validator=self.name,
+                severity=Severity.error,
+                message=message,
+                source=resolve_source(indexer, anchor.uri),
+                triples=((anchor.uri, str(BW_CONSTRAINS), target),),
+            )
+        ]
+    def _target_interval(
+        self, target: str, intervals: _IntervalView, uri_base: str
+    ) -> EventInterval | None:
+        """The interval to compare the span against: timeline bounds, an event's
+        interval, or ``None`` for a non-temporal / non-event target (D3)."""
+        if target == str(timeline_uri(uri_base)):
+            return intervals.timeline
+        return intervals.events.get(target)

bookwright/validation/validators/focalization.py ADDED Viewed

@@ -0,0 +1,152 @@
+"""``focalization`` — prose vs. the declared narrative voice (FR-018, research D5).
+Reads the constitution's narrative-voice declaration (Spanish "Voz narrativa" or
+English "Narrative voice", case-insensitive) for the declared grammatical person and,
+if a bible character is named there, the focal character. Then flags two heuristic
+breaks, LLM-free, defaulting to ``warning``:
+* first-person pronouns outside dialogue when **third person** is declared,
+* interiority verbs attached to a **non-focal** bible character (head-hopping) under
+  **third-person-limited**.
+No parsable declaration → zero findings (edge case).
+"""
+from __future__ import annotations
+import re
+from dataclasses import dataclass
+from typing import ClassVar
+from bookwright.indexers import Indexer
+from bookwright.validation.base import Severity, ValidationContext, Violation
+# The declaration line: "Voz narrativa: …" / "Narrative voice: …" at the start of a
+# line (leading whitespace allowed, case-insensitive); the rest of the line is ``body``.
+_DECLARATION = re.compile(r"(?im)^\s*(?:voz narrativa|narrative voice)\s*:\s*(?P<body>.+)$")
+# Keywords looked for inside the declaration body (Spanish and English, case-insensitive).
+_THIRD = re.compile(r"(?i)\b(tercera|third)\b")
+_FIRST = re.compile(r"(?i)\b(primera|first)\b")
+_LIMITED = re.compile(r"(?i)\b(limitada|limitado|limited)\b")
+# First-person markers we treat as a voice break outside dialogue (conservative).
+# The lookarounds act as word boundaries that also count accented Spanish letters.
+# NOTE(review): matching is case-insensitive, so a bare "I"/"i" token of any kind
+# (for example a Roman numeral) also matches — confirm that is acceptable.
+_FIRST_PERSON = re.compile(r"(?i)(?<![\wáéíóúñ])(yo|nosotros|nosotras|i|we)(?![\wáéíóúñ])")
+# Lines whose first non-blank character is one of these openers count as dialogue and
+# are exempt: em dash, en dash, plain hyphen, straight and curly quotes, and guillemets.
+# Spanish typography (en/em dashes, angle + curly quotes) is intentional here.
+_DIALOGUE_PREFIX = ("—", "–", "-", '"', "«", "“", "'", "‘")  # noqa: RUF001
+# Interiority verbs — third-person reports of a character's inner life
+# (Spanish preterite forms followed by English past-tense forms).
+_INTERIORITY = re.compile(
+    r"(?i)(?<![\wáéíóúñ])"
+    r"(pensó|sintió|supo|recordó|creyó|temió|imaginó|comprendió|deseó|"
+    r"thought|felt|knew|remembered|believed|feared|wondered|realized|realised|wished)"
+    r"(?![\wáéíóúñ])"
+)
+@dataclass(frozen=True)
+class _Declaration:
+    """The narrative-voice declaration as parsed from the constitution text."""
+    person: str | None  # "first" | "third" | None
+    limited: bool  # True when the declaration body contains a "limited" keyword
+    focal: str | None  # bible character named in the declaration, if any
+class Focalization:
+    """Flags prose that breaks the declared narrative person / focal character."""
+    name: ClassVar[str] = "focalization"
+    severity_default: ClassVar[Severity] = Severity.warning
+    def validate(self, project: ValidationContext, indexer: Indexer) -> list[Violation]:
+        constitution = project.constitution_text()
+        if constitution is None:
+            return []
+        character_names = [name for name, _ in project.character_names()]
+        declaration = _parse_declaration(constitution, character_names)
+        if declaration is None or declaration.person is None:
+            return []
+        files = project.manuscript_files()
+        out: list[Violation] = []
+        if declaration.person == "third":
+            out.extend(self._first_person_breaks(files))
+            if declaration.limited:
+                out.extend(self._head_hopping(files, character_names, declaration.focal))
+        return out
+    def _first_person_breaks(self, files: tuple[tuple[str, str], ...]) -> list[Violation]:
+        out: list[Violation] = []
+        for relpath, text in files:
+            for lineno, line in enumerate(text.splitlines(), start=1):
+                if _is_dialogue(line):
+                    continue
+                match = _FIRST_PERSON.search(line)
+                if match:
+                    out.append(
+                        Violation(
+                            validator=self.name,
+                            severity=Severity.warning,
+                            message=(
+                                f"first-person marker '{match.group(1)}' outside dialogue, but "
+                                "the constitution declares a third-person narrative voice"
+                            ),
+                            source=f"{relpath}:{lineno}",
+                            triples=(),
+                        )
+                    )
+                    break  # one finding per file (citing the first break)
+        return out
+    def _head_hopping(
+        self,
+        files: tuple[tuple[str, str], ...],
+        character_names: list[str],
+        focal: str | None,
+    ) -> list[Violation]:
+        non_focal = sorted(n for n in character_names if n != focal)
+        seen: set[str] = set()
+        out: list[Violation] = []
+        for relpath, text in files:
+            for lineno, line in enumerate(text.splitlines(), start=1):
+                if not _INTERIORITY.search(line):
+                    continue
+                for name in non_focal:
+                    if name in seen:
+                        continue
+                    if re.search(rf"\b{re.escape(name)}\b", line):
+                        seen.add(name)
+                        out.append(
+                            Violation(
+                                validator=self.name,
+                                severity=Severity.warning,
+                                message=(
+                                    f"interiority attributed to '{name}', a non-focal character, "
+                                    "under a third-person-limited narrative voice (head-hopping)"
+                                ),
+                                source=f"{relpath}:{lineno}",
+                                triples=(),
+                            )
+                        )
+        return out
+def _parse_declaration(text: str, character_names: list[str]) -> _Declaration | None:
+    match = _DECLARATION.search(text)
+    if match is None:
+        return None
+    body = match.group("body")
+    person: str | None = None
+    if _THIRD.search(body):
+        person = "third"
+    elif _FIRST.search(body):
+        person = "first"
+    focal = next(
+        (
+            name
+            for name in sorted(character_names, key=len, reverse=True)
+            if re.search(rf"\b{re.escape(name)}\b", body)
+        ),
+        None,
+    )
+    return _Declaration(person=person, limited=bool(_LIMITED.search(body)), focal=focal)
+def _is_dialogue(line: str) -> bool:
+    stripped = line.lstrip()
+    return stripped.startswith(_DIALOGUE_PREFIX)

bookwright/validation/validators/setting_continuity.py ADDED Viewed

@@ -0,0 +1,100 @@
+"""``setting_continuity`` — contradicting descriptors for one setting (FR-017, D4).
+A small built-in **contradiction lexicon** of antonym groups (e.g. *coastal* /
+*inland*). When the same setting is described with two terms from one group in
+**different files**, that is a continuity warning citing both locations. Heuristic
+and LLM-free, so it defaults to ``warning`` — it never gates CI.
+"""
+from __future__ import annotations
+import re
+from typing import ClassVar
+from bookwright.indexers import Indexer
+from bookwright.validation.base import Severity, ValidationContext, Violation
+# Antonym groups: two terms from one group on one setting, in different files, clash.
+# English and Spanish groups are listed separately; Spanish groups carry both
+# grammatical genders of a descriptor where they differ.
+_LEXICON: tuple[tuple[str, ...], ...] = (
+    ("coastal", "inland"),
+    ("costera", "costero", "interior"),
+    ("urban", "rural"),
+    ("urbana", "urbano", "rural"),
+    ("mountainous", "flat"),
+    ("montañosa", "montañoso", "llana", "llano"),
+    ("tropical", "arctic"),
+    ("desert", "forest"),
+    ("desierto", "bosque"),
+)
+# Word-boundary matcher per lexicon term, compiled once at import (not per line).
+# Matching is case-insensitive. A term listed in more than one group ("rural")
+# gets a single entry, because the dict is keyed by the term itself.
+_TERM_PATTERNS: dict[str, re.Pattern[str]] = {
+    term: re.compile(rf"\b{re.escape(term)}\b", re.IGNORECASE)
+    for group in _LEXICON
+    for term in group
+}
+class SettingContinuity:
+    """Flags a setting tagged with mutually-exclusive descriptors across files."""
+    name: ClassVar[str] = "setting_continuity"
+    severity_default: ClassVar[Severity] = Severity.warning
+    def validate(self, project: ValidationContext, indexer: Indexer) -> list[Violation]:
+        files = project.manuscript_files()
+        out: list[Violation] = []
+        for setting_name, _ in project.setting_names():
+            out.extend(self._check_setting(setting_name, files))
+        return out
+    def _check_setting(
+        self, setting_name: str, files: tuple[tuple[str, str], ...]
+    ) -> list[Violation]:
+        name_re = re.compile(rf"\b{re.escape(setting_name)}\b", re.IGNORECASE)
+        # term → (relpath, line) of its first occurrence in a file mentioning the setting.
+        occurrences: dict[str, tuple[str, int]] = {}
+        for relpath, text in files:
+            if not name_re.search(text):
+                continue
+            for lineno, line in enumerate(text.splitlines(), start=1):
+                for term, pattern in _TERM_PATTERNS.items():
+                    if term in occurrences:
+                        continue
+                    if pattern.search(line):
+                        occurrences[term] = (relpath, lineno)
+        out: list[Violation] = []
+        for group in _LEXICON:
+            present = [term for term in group if term in occurrences]
+            clash = _first_cross_file_pair(present, occurrences)
+            if clash is None:
+                continue
+            (term_a, loc_a), (term_b, loc_b) = clash
+            src_a, line_a = loc_a
+            src_b, line_b = loc_b
+            out.append(
+                Violation(
+                    validator=self.name,
+                    severity=Severity.warning,
+                    message=(
+                        f"setting '{setting_name}' is described as '{term_a}' "
+                        f"({src_a}:{line_a}) and '{term_b}' ({src_b}:{line_b}) — "
+                        "contradicting descriptors across files"
+                    ),
+                    source=f"{src_a}:{line_a}",
+                    triples=(),
+                )
+            )
+        return out
+def _first_cross_file_pair(
+    present: list[str], occurrences: dict[str, tuple[str, int]]
+) -> tuple[tuple[str, tuple[str, int]], tuple[str, tuple[str, int]]] | None:
+    """The first pair of present terms whose recorded files differ (sorted, D8)."""
+    for i in range(len(present)):
+        for j in range(i + 1, len(present)):
+            a, b = present[i], present[j]
+            if occurrences[a][0] != occurrences[b][0]:
+                return (a, occurrences[a]), (b, occurrences[b])
+    return None