PyPI - crieur - Versions diffs - 2.0.2__py3-none-any.whl - Mend

crieur 2.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

crieur/__init__.py +4 -0
crieur/__main__.py +3 -0
crieur/cli.py +169 -0
crieur/generator.py +181 -0
crieur/models.py +408 -0
crieur/plugins.py +110 -0
crieur/statics/font_caslon_pro.css +26 -0
crieur/statics/font_noto_sans.css +33 -0
crieur/statics/pico.css +2835 -0
crieur/styles/apa.csl +2133 -0
crieur/templates/article.html +44 -0
crieur/templates/author.html +52 -0
crieur/templates/authors.html +21 -0
crieur/templates/base.html +307 -0
crieur/templates/blog.html +23 -0
crieur/templates/homepage.html +99 -0
crieur/templates/keyword.html +49 -0
crieur/templates/keywords.html +24 -0
crieur/templates/numero.html +46 -0
crieur/templates/numeros.html +24 -0
crieur/typography.py +93 -0
crieur/utils.py +56 -0
crieur-2.0.2.dist-info/METADATA +838 -0
crieur-2.0.2.dist-info/RECORD +27 -0
crieur-2.0.2.dist-info/WHEEL +4 -0
crieur-2.0.2.dist-info/entry_points.txt +2 -0
crieur-2.0.2.dist-info/licenses/LICENSE +661 -0

crieur/models.py ADDED Viewed

@@ -0,0 +1,408 @@
+import re
+from dataclasses import dataclass
+from datetime import datetime
+from os import closerange
+from pathlib import Path
+from textwrap import dedent
+from typing import Optional
+import mistune
+from citeproc import (
+    Citation,
+    CitationItem,
+    CitationStylesBibliography,
+    CitationStylesStyle,
+    formatter,
+)
+from citeproc.source.bibtex import BibTeX
+from dataclass_wizard import DatePattern, DumpMeta, YAMLWizard
+from dataclass_wizard import errors as dw_errors
+from PIL import Image, UnidentifiedImageError
+from slugify import slugify
+from yaml.composer import ComposerError
+from .generator import mistune_plugins
+from .typography import typographie
+RE_CITATIONS_REFS = re.compile(r"\[\@(?P<ref>.*)\]")
+@dataclass
+class Settings:
+    # Configuration values read by the models of this module. The declaration
+    # order below is also the positional order of the generated constructor.
+    title: str
+    # Prepended to the article URL when `ImgsWithSizesRenderer` builds image links.
+    base_url: str
+    extra_vars: str
+    target_path: Path
+    source_path: Path
+    statics_path: Path
+    templates_path: Path
+    # Citation style passed to `CitationStylesStyle` by `Article.content_html`.
+    csl_path: Path
+    without_statics: bool
+    feed_limit: int
+class FrenchTypographyRenderer(mistune.HTMLRenderer):
+    """Apply French typographic rules to text."""
+    def text(self, text):
+        text = text.replace("\\ ", " ")
+        return typographie(super().text(text), html=True)
+    def block_html(self, html):
+        html = html.replace("\\ ", " ")
+        return typographie(super().block_html(html), html=True)
+class ImgsWithSizesRenderer(FrenchTypographyRenderer):
+    """Renders images as <figure>s and add sizes."""
+    def __init__(self, escape=True, allow_harmful_protocols=None, article=None):
+        super().__init__(escape, allow_harmful_protocols)
+        self._article = article
+    def paragraph(self, text):
+        # In case of a figure, we do not want the (non-standard) paragraph.
+        if text.strip().startswith("<figure>"):
+            return text
+        return super().paragraph(text)
+    def image(self, text, url, title=None):
+        if self._article.images_path is None:
+            print(f"Image with URL `{url}` is discarded.")
+            return ""
+        full_path = self._article.images_path.resolve().parent / url
+        try:
+            image = Image.open(full_path)
+        except (IsADirectoryError, FileNotFoundError, UnidentifiedImageError):
+            print(f"`{full_path}` is not a valid image.")
+            return ""
+        width, height = image.size
+        caption = f"<figcaption>{text}</figcaption>" if text else ""
+        full_url = f"{self._article.settings.base_url}{self._article.url}{url}"
+        return dedent(
+            f"""\
+            <figure>
+                <a href="{full_url}"
+                    title="Cliquer pour une version haute résolution">
+                    <img
+                        src="{full_url}"
+                        width="{width}" height="{height}"
+                        loading="lazy"
+                        decoding="async"
+                        alt="{text}">
+                </a>
+                {caption}
+            </figure>
+            """
+        )
+@dataclass
+class Numero(YAMLWizard):
+    _id: str
+    name: str
+    description: str
+    metadata: str
+    articles: list
+    title: str = ""
+    title_f: str = ""
+    @property
+    def date(self):
+        return max(article.date for article in self.articles)
+    def __lt__(self, other: "Numero"):
+        if not isinstance(other, Numero):
+            return NotImplemented
+        return self.date < other.date
+    def __post_init__(self):
+        self.slug = slugify(self.name)
+    def configure_articles(self, yaml_path, settings):
+        # Preserves abstract_fr key (vs. abstract-fr) when converting to_yaml()
+        DumpMeta(key_transform="SNAKE").bind_to(Article)
+        loaded_articles = []
+        for article in self.articles:
+            article_slug = slugify(article["article"]["title"])
+            article_folder = (
+                yaml_path.parent / f"{article_slug}-{article['article']['_id']}"
+            )
+            article_yaml_path = article_folder / f"{article_slug}.yaml"
+            try:
+                try:
+                    loaded_article = Article.from_yaml_file(article_yaml_path)
+                except ComposerError:
+                    loaded_article = Article.from_yaml(
+                        article_yaml_path.read_text().split("---")[1]
+                    )
+            except dw_errors.ParseError as e:
+                print(f"Metadata error in `{article['article']['title']}`:")
+                print(e)
+                exit(1)
+            if not loaded_article.date:
+                print(f"Article `{loaded_article.title}` skipped (no date).")
+                continue
+            if loaded_article.date > datetime.today().date():
+                print(
+                    f"Article `{loaded_article.title}` skipped "
+                    f"(future date: {loaded_article.date})."
+                )
+                continue
+            if not loaded_article.id:
+                loaded_article.id = article_slug
+            loaded_article.content_md = (
+                article_folder / f"{article_slug}.md"
+            ).read_text()
+            loaded_article.content_bib_path = article_folder / f"{article_slug}.bib"
+            loaded_article.images_path = (
+                article_folder / "images"
+                if (article_folder / "images").exists()
+                else None
+            )
+            self.title = loaded_article.dossier[0]["title"]
+            self.title_f = loaded_article.dossier[0]["title_f"]
+            loaded_article.numero = self
+            loaded_article.settings = settings
+            loaded_articles.append(loaded_article)
+        self.articles = sorted(loaded_articles, reverse=True)
+@dataclass
+class Article(YAMLWizard):
+    title: str
+    title_f: str
+    id: str = ""
+    subtitle: str = ""
+    subtitle_f: str = ""
+    content_md: str = ""
+    content_bib_path: Path = ""
+    settings: dict | None = None
+    dossier: list | None = None
+    date: Optional[DatePattern["%Y/%m/%d"]] = None  # noqa: F722
+    authors: list = None
+    abstract: list = None
+    keywords: list = None
+    def __post_init__(self):
+        self.slug = slugify(self.title)
+        md = mistune.create_markdown(escape=False)
+        self.title_f = md(self.title_f).strip()[len("<p>") : -len("</p>")]
+        self.subtitle_f = md(self.subtitle_f).strip()[len("<p>") : -len("</p>")]
+    def __eq__(self, other):
+        return self.id == other.id
+    def __lt__(self, other: "Article"):
+        if not isinstance(other, Article):
+            return NotImplemented
+        return self.date < other.date
+    @property
+    def abstract_fr(self):
+        for abstract in self.abstract:
+            if abstract.get("text_f") and (
+                abstract.get("lang") == "fr" or abstract.get("lang") is None
+            ):
+                return abstract["text_f"]
+    @property
+    def abstract_en(self):
+        for abstract in self.abstract:
+            if abstract.get("text_f") and abstract.get("lang") == "en":
+                return abstract["text_f"]
+    @property
+    def url(self):
+        return f"numero/{self.numero.slug}/article/{self.id}/"
+    @property
+    def content_html(self):
+        md = mistune.create_markdown(
+            renderer=ImgsWithSizesRenderer(escape=False, article=self),
+            plugins=mistune_plugins,
+            escape=False,
+        )
+        html_content = md(self.content_md)
+        bib_source = BibTeX(self.content_bib_path, encoding="utf-8")
+        bib_style = CitationStylesStyle(self.settings.csl_path)
+        bibliography = CitationStylesBibliography(bib_style, bib_source, formatter.html)
+        # Processing citations in a document needs to be done in two passes as for some
+        # CSL styles, a citation can depend on the order of citations in the
+        # bibliography and thus on citations following the current one.
+        # For this reason, we first need to register all citations with the
+        # CitationStylesBibliography.
+        citations = {}
+        def clean_ref(citation_ref):
+            # TODO: deal with page references (for instance `[@goody_raison_1979, pp.115]`).
+            return citation_ref.split(",")[0]
+        for citation_ref in RE_CITATIONS_REFS.findall(html_content):
+            citation_ref = clean_ref(citation_ref)
+            citation = Citation([CitationItem(citation_ref)])
+            bibliography.register(citation)
+            citations[citation_ref] = citation
+        def warn(citation_item):
+            print(
+                "WARNING: Reference with key '{}' not found in the bibliography.".format(
+                    citation_item.key
+                )
+            )
+        # In the second pass, CitationStylesBibliography can generate citations.
+        # CitationStylesBibliography.cite() requires a callback function to be passed
+        # along to be called in case a CitationItem's key is not present in the
+        # bibliography.
+        def replace_reference(match_object):
+            citation_ref = match_object.group("ref")
+            citation_ref = clean_ref(citation_ref)
+            return "".join(
+                f"""
+                <a href="#ref_{citation_ref}" id="anchor_{citation_ref}">
+                    {bibliography.cite(citations[citation_ref], warn)}
+                </a>
+            """.split("\n")
+            )
+        html_content = re.sub(RE_CITATIONS_REFS, replace_reference, html_content)
+        html_bibliography = ""
+        def clean_item(item):
+            # As of 2025, citeproc-py does not support repeated punctuation.
+            return str(item).replace("..", ".").replace(".</i>.", ".</i>")
+        for citation, item in zip(bibliography.items, bibliography.bibliography()):
+            citation_ref = citation.reference.get("key")
+            cleaned_item = clean_item(item)
+            html_bibliography += f"""
+            <li>
+                <span id="ref_{citation_ref}">
+                    {cleaned_item}
+                    <a href="#anchor_{citation_ref}">↩</a>
+                </span>
+            </li>
+            """
+        html_content = html_content.replace(
+            "<h2>Bibliographie</h2>",
+            f"<h2>Bibliographie</h2>\n\n<ul>{html_bibliography}</ul>",
+        )
+        return html_content
+def configure_numero(yaml_path, settings):
+    # Preserves abstract_fr key (vs. abstract-fr) when converting to_yaml()
+    DumpMeta(key_transform="SNAKE").bind_to(Numero)
+    try:
+        numero = Numero.from_yaml_file(yaml_path)
+    except ComposerError:
+        numero = Numero.from_yaml(yaml_path.read_text().split("---")[1])
+    numero.configure_articles(yaml_path, settings)
+    return numero
+@dataclass
+class Keyword:
+    slug: str
+    name: str
+    articles: list
+    def __eq__(self, other):
+        return self.slug == other.slug
+    def __lt__(self, other: "Keyword"):
+        if not isinstance(other, Keyword):
+            return NotImplemented
+        len_self = len(self.articles)
+        len_other = len(other.articles)
+        if len_self == len_other:
+            return self.slug > other.slug
+        return len_self < len_other
+@dataclass
+class Author:
+    slug: str
+    forname: str
+    surname: str
+    articles: list
+    biography: str = ""
+    def __str__(self):
+        return f"{self.forname} {self.surname}"
+    def __eq__(self, other):
+        return self.slug == other.slug
+    def __lt__(self, other: "Author"):
+        if not isinstance(other, Author):
+            return NotImplemented
+        len_self = len(self.articles)
+        len_other = len(other.articles)
+        if len_self == len_other:
+            return self.slug > other.slug
+        return len_self < len_other
+def collect_keywords(numeros):
+    keywords = {}
+    for numero in numeros:
+        for article in numero.articles:
+            article_keywords = []
+            for kwds in article.keywords:
+                if kwds.get("list") and kwds.get("lang") == "fr":  # TODO: en?
+                    for keyword in kwds.get("list", "").split(", "):
+                        keyword_slug = slugify(keyword)
+                        if keyword_slug in keywords:
+                            keywords[keyword_slug].articles.append(article)
+                            kw = keywords[keyword_slug]
+                        else:
+                            kw = Keyword(
+                                slug=keyword_slug, name=keyword, articles=[article]
+                            )
+                            keywords[keyword_slug] = kw
+                        article_keywords.append(kw)
+            article.keywords = article_keywords
+    return dict(sorted(keywords.items(), key=lambda item: item[1], reverse=True))
+def collect_authors(numeros):
+    authors = {}
+    for numero in numeros:
+        for article in numero.articles:
+            article_authors = []
+            if not article.authors:
+                continue
+            for athr in article.authors:
+                author_forname = athr.get("forname", "")
+                author_surname = athr.get("surname", "")
+                author_biography = athr.get("biography", "")
+                author_name = f"{author_forname} {author_surname}".strip()
+                if not author_name:
+                    continue
+                author_slug = slugify(author_name)
+                if author_slug in authors:
+                    authors[author_slug].articles.append(article)
+                    kw = authors[author_slug]
+                else:
+                    kw = Author(
+                        slug=author_slug,
+                        forname=author_forname,
+                        surname=author_surname,
+                        articles=[article],
+                        biography=author_biography,
+                    )
+                    authors[author_slug] = kw
+                article_authors.append(kw)
+            article.authors = article_authors
+    return dict(sorted(authors.items(), key=lambda item: item[1], reverse=True))

crieur/plugins.py ADDED Viewed

@@ -0,0 +1,110 @@
+from typing import Any, Dict, List, Match, Union
+from mistune.core import BlockState
+__all__ = ["inline_footnotes"]
+# Inline footnote marker: `^[footnote text]`; the text cannot contain `]`.
+# https://michelf.ca/projects/php-markdown/extra/#footnotes
+INLINE_FOOTNOTE = r"\^\[(?P<footnote_inlined>[^\]]*)\]"
+def parse_inline_footnote(
+    inline: "InlineParser", m: Match[str], state: "InlineState"
+) -> int:
+    key = m.group("footnote_inlined")
+    notes = state.env.get("inline_footnotes")
+    if not notes:
+        notes = []
+    if key not in notes:
+        notes.append(key)
+        state.env["inline_footnotes"] = notes
+    state.append_token(
+        {
+            "type": "footnote_ref",
+            "raw": key,
+            "attrs": {"index": notes.index(key) + 1},
+        }
+    )
+    return m.end()
+def parse_footnote_item(
+    block: "BlockParser", key: str, index: int, state: BlockState
+) -> Dict[str, Any]:
+    return {
+        "type": "footnote_item",
+        "children": [{"type": "paragraph", "text": key}],
+        "attrs": {"key": key, "index": index},
+    }
+def md_footnotes_hook(
+    md: "Markdown", result: Union[str, List[Dict[str, Any]]], state: BlockState
+) -> Union[str, List[Dict[str, Any]]]:
+    notes = state.env.get("inline_footnotes")
+    if not notes:
+        return result
+    children = [
+        parse_footnote_item(md.block, k, i + 1, state) for i, k in enumerate(notes)
+    ]
+    state = BlockState()
+    state.tokens = [{"type": "footnotes", "children": children}]
+    output = md.render_state(state)
+    return result + output  # type: ignore[operator]
+def render_inline_footnote_ref(renderer: "BaseRenderer", key: str, index: int) -> str:
+    i = str(index)
+    html = '<sup class="footnote-ref" id="fnref-' + i + '">'
+    return html + '<a href="#fn-' + i + '">' + i + "</a></sup>"
+def render_inline_footnotes(renderer: "BaseRenderer", text: str) -> str:
+    return '<hr><section class="footnotes">\n<ol>\n' + text + "</ol>\n</section>\n"
+def render_inline_footnote_item(
+    renderer: "BaseRenderer", text: str, key: str, index: int
+) -> str:
+    i = str(index)
+    back = '<a href="#fnref-' + i + '" class="footnote">&#8617;</a>'
+    text = text.rstrip()[:-4] + back + "</p>"
+    return '<li id="fn-' + i + '">' + text + "</li>\n"
+def inline_footnotes(md: "Markdown") -> None:
+    """A mistune plugin to support inline footnotes, spec defined at
+    https://michelf.ca/projects/php-markdown/extra/#footnotes
+    Here is an example:
+    .. code-block:: text
+        That's some text with a footnote.^[And that's the footnote.]
+    It will be converted into HTML:
+    .. code-block:: html
+        <p>That's some text with a footnote.<sup class="footnote-ref" id="fnref-1"><a href="#fn-1">1</a></sup></p>
+        <section class="footnotes">
+        <ol>
+        <li id="fn-1"><p>And that's the footnote.<a href="#fnref-1" class="footnote">&#8617;</a></p></li>
+        </ol>
+        </section>
+    :param md: Markdown instance
+    """
+    md.inline.register(
+        "inline_footnote",
+        INLINE_FOOTNOTE,
+        parse_inline_footnote,
+        before="link",
+    )
+    md.after_render_hooks.append(md_footnotes_hook)
+    if md.renderer and md.renderer.NAME == "html":
+        md.renderer.register("footnote_ref", render_inline_footnote_ref)
+        md.renderer.register("footnote_item", render_inline_footnote_item)
+        md.renderer.register("footnotes", render_inline_footnotes)