PyPI - markdown-to-confluence - Versions diffs - 0.5.2__py3-none-any.whl → 0.5.3__py3-none-any.whl - Mend

markdown-to-confluence 0.5.2-py3-none-any.whl → 0.5.3-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53) hide show

{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/METADATA +80 -4
markdown_to_confluence-0.5.3.dist-info/RECORD +55 -0
{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/licenses/LICENSE +1 -1
md2conf/__init__.py +2 -2
md2conf/__main__.py +42 -24
md2conf/api.py +27 -8
md2conf/attachment.py +72 -0
md2conf/coalesce.py +43 -0
md2conf/collection.py +1 -1
md2conf/{extra.py → compatibility.py} +1 -1
md2conf/converter.py +232 -649
md2conf/csf.py +13 -11
md2conf/drawio/__init__.py +0 -0
md2conf/drawio/extension.py +116 -0
md2conf/{drawio.py → drawio/render.py} +1 -1
md2conf/emoticon.py +3 -3
md2conf/environment.py +2 -2
md2conf/extension.py +78 -0
md2conf/external.py +49 -0
md2conf/formatting.py +135 -0
md2conf/frontmatter.py +70 -0
md2conf/image.py +127 -0
md2conf/latex.py +4 -183
md2conf/local.py +8 -8
md2conf/markdown.py +1 -1
md2conf/matcher.py +1 -1
md2conf/mermaid/__init__.py +0 -0
md2conf/mermaid/config.py +20 -0
md2conf/mermaid/extension.py +109 -0
md2conf/{mermaid.py → mermaid/render.py} +10 -38
md2conf/mermaid/scanner.py +55 -0
md2conf/metadata.py +1 -1
md2conf/{domain.py → options.py} +73 -16
md2conf/plantuml/__init__.py +0 -0
md2conf/plantuml/config.py +20 -0
md2conf/plantuml/extension.py +158 -0
md2conf/plantuml/render.py +139 -0
md2conf/plantuml/scanner.py +56 -0
md2conf/png.py +202 -0
md2conf/processor.py +32 -11
md2conf/publisher.py +14 -18
md2conf/scanner.py +31 -128
md2conf/serializer.py +2 -2
md2conf/svg.py +24 -2
md2conf/text.py +1 -1
md2conf/toc.py +1 -1
md2conf/uri.py +1 -1
md2conf/xml.py +1 -1
markdown_to_confluence-0.5.2.dist-info/RECORD +0 -36
{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/WHEEL +0 -0
{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/entry_points.txt +0 -0
{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/top_level.txt +0 -0
{markdown_to_confluence-0.5.2.dist-info → markdown_to_confluence-0.5.3.dist-info}/zip-safe +0 -0

md2conf/converter.py CHANGED Viewed

@@ -1,13 +1,12 @@
 """
 Publish Markdown files to Confluence wiki.
-Copyright 2022-2025, Levente Hunyadi
+Copyright 2022-2026, Levente Hunyadi
 :see: https://github.com/hunyadi/md2conf
 """
-import dataclasses
-import enum
+import copy
 import hashlib
 import logging
 import os.path
@@ -16,26 +15,31 @@ import uuid
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
 from pathlib import Path
-from typing import ClassVar, Literal
+from typing import ClassVar
 from urllib.parse import ParseResult, quote_plus, urlparse
 import lxml.etree as ET
-from cattrs import BaseValidationError
-from . import drawio, mermaid
+from .attachment import AttachmentCatalog, EmbeddedFileData, ImageData, attachment_name
+from .coalesce import coalesce
 from .collection import ConfluencePageCollection
+from .compatibility import override, path_relative_to
 from .csf import AC_ATTR, AC_ELEM, HTML, RI_ATTR, RI_ELEM, ParseError, elements_from_strings, elements_to_string, normalize_inline
-from .domain import ConfluenceDocumentOptions, ConfluencePageID
+from .drawio.extension import DrawioExtension
 from .emoticon import emoji_to_emoticon
 from .environment import PageError
-from .extra import override, path_relative_to
-from .latex import get_png_dimensions, remove_png_chunks, render_latex
+from .extension import ExtensionOptions, MarketplaceExtension
+from .formatting import FormattingContext, ImageAlignment, ImageAttributes
+from .image import ImageGenerator, ImageGeneratorOptions
+from .latex import render_latex
 from .markdown import markdown_to_html
-from .mermaid import MermaidConfigProperties
+from .mermaid.extension import MermaidExtension
 from .metadata import ConfluenceSiteMetadata
-from .scanner import MermaidScanner, ScannedDocument, Scanner
+from .options import ConfluencePageID, ConverterOptions, DocumentOptions
+from .plantuml.extension import PlantUMLExtension
+from .png import extract_png_dimensions, remove_png_chunks
+from .scanner import ScannedDocument, Scanner
 from .serializer import JsonType
-from .svg import fix_svg_dimensions, get_svg_dimensions, get_svg_dimensions_from_bytes
 from .toc import TableOfContentsBuilder
 from .uri import is_absolute_url, to_uuid_urn
 from .xml import element_to_text
@@ -47,20 +51,21 @@ def apply_generated_by_template(template: str, path: Path) -> str:
     """Apply template substitution to the generated_by string.
     Supported placeholders:
-    - %{filepath}: Full path to the file (relative to the root directory)
+    - %{filepath}: Full path to the file (relative to the source directory)
     - %{filename}: Just the filename
+    - %{filedir}: Dirname of the full path to the file (relative to the source directory)
+    - %{filestem}: Just the filename without the extension
     :param template: The template string with placeholders
     :param path: The path to the file being converted
     :returns: The template string with placeholders replaced
     """
-    return template.replace(
-        "%{filepath}",
-        path.as_posix(),
-    ).replace(
-        "%{filename}",
-        path.name,
+    return (
+        template.replace("%{filepath}", path.as_posix())
+        .replace("%{filename}", path.name)
+        .replace("%{filedir}", path.parent.as_posix())
+        .replace("%{filestem}", path.stem)
     )
@@ -166,7 +171,6 @@ _LANGUAGES = {
     "kotlin": "kotlin",
     "livescript": "livescript",
     "lua": "lua",
-    "mermaid": "mermaid",
     "mathematica": "mathematica",
     "matlab": "matlab",
     "objectivec": "objectivec",
@@ -271,170 +275,6 @@ def is_placeholder_for(node: ElementType, name: str) -> bool:
     return True
-@enum.unique
-class FormattingContext(enum.Enum):
-    "Identifies the formatting context for the element."
-    BLOCK = "block"
-    INLINE = "inline"
-@enum.unique
-class ImageAlignment(enum.Enum):
-    "Determines whether to align block-level images to center, left or right."
-    CENTER = "center"
-    LEFT = "left"
-    RIGHT = "right"
-@dataclass
-class ImageAttributes:
-    """
-    Attributes applied to an `<img>` element.
-    :param context: Identifies the formatting context for the element (block or inline).
-    :param width: Natural image width in pixels.
-    :param height: Natural image height in pixels.
-    :param alt: Alternate text.
-    :param title: Title text (a.k.a. image tooltip).
-    :param caption: Caption text (shown below figure).
-    :param alignment: Alignment for block-level images.
-    :param display_width: Constrained display width in pixels (if different from natural width).
-    """
-    context: FormattingContext
-    width: int | None
-    height: int | None
-    alt: str | None
-    title: str | None
-    caption: str | None
-    alignment: ImageAlignment = ImageAlignment.CENTER
-    display_width: int | None = None
-    def __post_init__(self) -> None:
-        if self.caption is None and self.context is FormattingContext.BLOCK:
-            self.caption = self.title or self.alt
-    def as_dict(self) -> dict[str, str]:
-        attributes: dict[str, str] = {}
-        if self.context is FormattingContext.BLOCK:
-            if self.alignment is ImageAlignment.LEFT:
-                attributes[AC_ATTR("align")] = "left"
-                attributes[AC_ATTR("layout")] = "align-start"
-            elif self.alignment is ImageAlignment.RIGHT:
-                attributes[AC_ATTR("align")] = "right"
-                attributes[AC_ATTR("layout")] = "align-end"
-            else:
-                attributes[AC_ATTR("align")] = "center"
-                attributes[AC_ATTR("layout")] = "center"
-            if self.width is not None:
-                attributes[AC_ATTR("original-width")] = str(self.width)
-            if self.height is not None:
-                attributes[AC_ATTR("original-height")] = str(self.height)
-            if self.width is not None:
-                attributes[AC_ATTR("custom-width")] = "true"
-                # Use display_width if set, otherwise use natural width
-                effective_width = self.display_width or self.width
-                attributes[AC_ATTR("width")] = str(effective_width)
-        elif self.context is FormattingContext.INLINE:
-            if self.width is not None:
-                attributes[AC_ATTR("width")] = str(self.width)
-            if self.height is not None:
-                attributes[AC_ATTR("height")] = str(self.height)
-        else:
-            raise NotImplementedError("match not exhaustive for enumeration")
-        if self.alt is not None:
-            attributes.update({AC_ATTR("alt"): self.alt})
-        if self.title is not None:
-            attributes.update({AC_ATTR("title"): self.title})
-        return attributes
-    EMPTY_BLOCK: ClassVar["ImageAttributes"]
-    EMPTY_INLINE: ClassVar["ImageAttributes"]
-    @classmethod
-    def empty(cls, context: FormattingContext) -> "ImageAttributes":
-        if context is FormattingContext.BLOCK:
-            return cls.EMPTY_BLOCK
-        elif context is FormattingContext.INLINE:
-            return cls.EMPTY_INLINE
-        else:
-            raise NotImplementedError("match not exhaustive for enumeration")
-ImageAttributes.EMPTY_BLOCK = ImageAttributes(
-    FormattingContext.BLOCK, width=None, height=None, alt=None, title=None, caption=None, alignment=ImageAlignment.CENTER
-)
-ImageAttributes.EMPTY_INLINE = ImageAttributes(
-    FormattingContext.INLINE, width=None, height=None, alt=None, title=None, caption=None, alignment=ImageAlignment.CENTER
-)
-@dataclass
-class ConfluenceConverterOptions:
-    """
-    Options for converting an HTML tree into Confluence storage format.
-    :param ignore_invalid_url: When true, ignore invalid URLs in input, emit a warning and replace the anchor with
-        plain text; when false, raise an exception.
-    :param heading_anchors: When true, emit a structured macro *anchor* for each section heading using GitHub
-        conversion rules for the identifier.
-    :param skip_title_heading: Whether to remove the first heading from document body when used as page title.
-    :param prefer_raster: Whether to choose PNG files over SVG files when available.
-    :param render_drawio: Whether to pre-render (or use the pre-rendered version of) draw.io diagrams.
-    :param render_mermaid: Whether to pre-render Mermaid diagrams into PNG/SVG images.
-    :param render_latex: Whether to pre-render LaTeX formulas into PNG/SVG images.
-    :param diagram_output_format: Target image format for diagrams.
-    :param webui_links: When true, convert relative URLs to Confluence Web UI links.
-    :param alignment: Alignment for block-level images and formulas.
-    :param max_image_width: Maximum display width for images in pixels.
-    :param use_panel: Whether to transform admonitions and alerts into a Confluence custom panel.
-    """
-    ignore_invalid_url: bool = False
-    heading_anchors: bool = False
-    skip_title_heading: bool = False
-    prefer_raster: bool = True
-    render_drawio: bool = False
-    render_mermaid: bool = False
-    render_latex: bool = False
-    diagram_output_format: Literal["png", "svg"] = "png"
-    webui_links: bool = False
-    alignment: Literal["center", "left", "right"] = "center"
-    max_image_width: int | None = None
-    use_panel: bool = False
-    def calculate_display_width(self, natural_width: int | None) -> int | None:
-        """
-        Calculate the display width for an image, applying max_image_width constraint if set.
-        :param natural_width: The natural width of the image in pixels.
-        :returns: The constrained display width, or None if no constraint is needed.
-        """
-        if natural_width is None or self.max_image_width is None:
-            return None
-        if natural_width <= self.max_image_width:
-            return None  # no constraint needed, image is already within limits
-        return self.max_image_width
-@dataclass
-class ImageData:
-    path: Path
-    description: str | None = None
-@dataclass
-class EmbeddedFileData:
-    data: bytes
-    description: str | None = None
 @dataclass
 class ConfluencePanel:
     emoji: str
@@ -475,20 +315,22 @@ ConfluencePanel.from_class = {
 class ConfluenceStorageFormatConverter(NodeVisitor):
     "Transforms a plain HTML tree into Confluence Storage Format."
-    options: ConfluenceConverterOptions
+    options: ConverterOptions
     path: Path
     base_dir: Path
     root_dir: Path
     toc: TableOfContentsBuilder
     links: list[str]
-    images: list[ImageData]
-    embedded_files: dict[str, EmbeddedFileData]
+    attachments: AttachmentCatalog
     site_metadata: ConfluenceSiteMetadata
     page_metadata: ConfluencePageCollection
+    image_generator: ImageGenerator
+    extensions: list[MarketplaceExtension]
     def __init__(
         self,
-        options: ConfluenceConverterOptions,
+        options: ConverterOptions,
         path: Path,
         root_dir: Path,
         site_metadata: ConfluenceSiteMetadata,
@@ -505,11 +347,22 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         self.root_dir = root_dir
         self.toc = TableOfContentsBuilder()
         self.links = []
-        self.images = []
-        self.embedded_files = {}
+        self.attachments = AttachmentCatalog()
         self.site_metadata = site_metadata
         self.page_metadata = page_metadata
+        self.image_generator = ImageGenerator(
+            self.base_dir,
+            self.attachments,
+            ImageGeneratorOptions(self.options.diagram_output_format, self.options.prefer_raster, self.options.layout.image.max_width),
+        )
+        self.extensions = [
+            DrawioExtension(self.image_generator, ExtensionOptions(render=self.options.render_drawio)),
+            MermaidExtension(self.image_generator, ExtensionOptions(render=self.options.render_mermaid)),
+            PlantUMLExtension(self.image_generator, ExtensionOptions(render=self.options.render_plantuml)),
+        ]
     def _transform_heading(self, heading: ElementType) -> None:
         """
         Adds anchors to headings in the same document (if *heading anchors* is enabled).
@@ -660,7 +513,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
             return None
         file_name = attachment_name(path_relative_to(absolute_path, self.base_dir))
-        self.images.append(ImageData(absolute_path))
+        self.attachments.add_image(ImageData(absolute_path))
         link_body = AC_ELEM("link-body", {}, *list(anchor))
         link_body.text = anchor.text
@@ -728,8 +581,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
             alt=alt,
             title=title,
             caption=None,
-            alignment=ImageAlignment(self.options.alignment),
-            display_width=self.options.calculate_display_width(pixel_width),
+            alignment=ImageAlignment(self.options.layout.get_image_alignment()),
         )
         if is_absolute_url(src):
@@ -741,14 +593,11 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
             if absolute_path is None:
                 return self._create_missing(path, attrs)
-            if absolute_path.name.endswith(".drawio.png") or absolute_path.name.endswith(".drawio.svg"):
-                return self._transform_drawio_image(absolute_path, attrs)
-            elif absolute_path.name.endswith(".drawio.xml") or absolute_path.name.endswith(".drawio"):
-                return self._transform_drawio(absolute_path, attrs)
-            elif absolute_path.name.endswith(".mmd") or absolute_path.name.endswith(".mermaid"):
-                return self._transform_external_mermaid(absolute_path, attrs)
-            else:
-                return self._transform_attached_image(absolute_path, attrs)
+            for extension in self.extensions:
+                if extension.matches_image(absolute_path):
+                    return extension.transform_image(absolute_path, attrs)
+            return self.image_generator.transform_attached_image(absolute_path, attrs)
     def _transform_external_image(self, url: str, attrs: ImageAttributes) -> ElementType:
         "Emits Confluence Storage Format XHTML for an external image."
@@ -764,7 +613,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         if attrs.caption:
             elements.append(AC_ELEM("caption", attrs.caption))
-        return AC_ELEM("image", attrs.as_dict(), *elements)
+        return AC_ELEM("image", attrs.as_dict(max_width=self.options.layout.image.max_width), *elements)
     def _warn_or_raise(self, msg: str) -> None:
         "Emit a warning or raise an exception when a path points to a resource that doesn't exist or is outside of the permitted hierarchy."
@@ -793,132 +642,6 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         return absolute_path
-    def _transform_attached_image(self, absolute_path: Path, attrs: ImageAttributes) -> ElementType:
-        "Emits Confluence Storage Format XHTML for an attached raster or vector image."
-        if self.options.prefer_raster and absolute_path.suffix == ".svg":
-            # prefer PNG over SVG; Confluence displays SVG in wrong size, and text labels are truncated
-            png_file = absolute_path.with_suffix(".png")
-            if png_file.exists():
-                absolute_path = png_file
-        # infer SVG dimensions if not already specified
-        if absolute_path.suffix == ".svg" and attrs.width is None and attrs.height is None:
-            svg_width, svg_height = get_svg_dimensions(absolute_path)
-            if svg_width is not None:
-                attrs = ImageAttributes(
-                    context=attrs.context,
-                    width=svg_width,
-                    height=svg_height,
-                    alt=attrs.alt,
-                    title=attrs.title,
-                    caption=attrs.caption,
-                    alignment=attrs.alignment,
-                    display_width=self.options.calculate_display_width(svg_width),
-                )
-        self.images.append(ImageData(absolute_path, attrs.alt))
-        image_name = attachment_name(path_relative_to(absolute_path, self.base_dir))
-        return self._create_attached_image(image_name, attrs)
-    def _transform_drawio(self, absolute_path: Path, attrs: ImageAttributes) -> ElementType:
-        "Emits Confluence Storage Format XHTML for a draw.io diagram."
-        if not absolute_path.name.endswith(".drawio.xml") and not absolute_path.name.endswith(".drawio"):
-            raise DocumentError("invalid image format; expected: `*.drawio.xml` or `*.drawio`")
-        relative_path = path_relative_to(absolute_path, self.base_dir)
-        if self.options.render_drawio:
-            image_data = drawio.render_diagram(absolute_path, self.options.diagram_output_format)
-            image_filename = attachment_name(relative_path.with_suffix(f".{self.options.diagram_output_format}"))
-            self.embedded_files[image_filename] = EmbeddedFileData(image_data, attrs.alt)
-            return self._create_attached_image(image_filename, attrs)
-        else:
-            self.images.append(ImageData(absolute_path, attrs.alt))
-            image_filename = attachment_name(relative_path)
-            return self._create_drawio(image_filename, attrs)
-    def _transform_drawio_image(self, absolute_path: Path, attrs: ImageAttributes) -> ElementType:
-        "Emits Confluence Storage Format XHTML for a draw.io diagram embedded in a PNG or SVG image."
-        if not absolute_path.name.endswith(".drawio.png") and not absolute_path.name.endswith(".drawio.svg"):
-            raise DocumentError("invalid image format; expected: `*.drawio.png` or `*.drawio.svg`")
-        if self.options.render_drawio:
-            return self._transform_attached_image(absolute_path, attrs)
-        else:
-            # extract embedded editable diagram and upload as *.drawio
-            image_data = drawio.extract_diagram(absolute_path)
-            image_filename = attachment_name(path_relative_to(absolute_path.with_suffix(".xml"), self.base_dir))
-            self.embedded_files[image_filename] = EmbeddedFileData(image_data, attrs.alt)
-            return self._create_drawio(image_filename, attrs)
-    def _create_attached_image(self, image_name: str, attrs: ImageAttributes) -> ElementType:
-        "An image embedded into the page, linking to an attachment."
-        elements: list[ElementType] = []
-        elements.append(
-            RI_ELEM(
-                "attachment",
-                # refers to an attachment uploaded alongside the page
-                {RI_ATTR("filename"): image_name},
-            )
-        )
-        if attrs.caption:
-            elements.append(AC_ELEM("caption", attrs.caption))
-        return AC_ELEM("image", attrs.as_dict(), *elements)
-    def _create_drawio(self, filename: str, attrs: ImageAttributes) -> ElementType:
-        "A draw.io diagram embedded into the page, linking to an attachment."
-        parameters: list[ElementType] = [
-            AC_ELEM(
-                "parameter",
-                {AC_ATTR("name"): "diagramName"},
-                filename,
-            ),
-        ]
-        if attrs.width is not None:
-            parameters.append(
-                AC_ELEM(
-                    "parameter",
-                    {AC_ATTR("name"): "width"},
-                    str(attrs.width),
-                ),
-            )
-        if attrs.height is not None:
-            parameters.append(
-                AC_ELEM(
-                    "parameter",
-                    {AC_ATTR("name"): "height"},
-                    str(attrs.height),
-                ),
-            )
-        if attrs.alignment is ImageAlignment.CENTER:
-            parameters.append(
-                AC_ELEM(
-                    "parameter",
-                    {AC_ATTR("name"): "pCenter"},
-                    str(1),
-                ),
-            )
-        local_id = str(uuid.uuid4())
-        macro_id = str(uuid.uuid4())
-        return AC_ELEM(
-            "structured-macro",
-            {
-                AC_ATTR("name"): "drawio",
-                AC_ATTR("schema-version"): "1",
-                "data-layout": "default",
-                AC_ATTR("local-id"): local_id,
-                AC_ATTR("macro-id"): macro_id,
-            },
-            *parameters,
-        )
     def _create_missing(self, path: Path, attrs: ImageAttributes) -> ElementType:
         "A warning panel for a missing image."
@@ -950,6 +673,9 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
     def _transform_code_block(self, code: ElementType) -> ElementType:
         "Transforms a code block."
+        content: str = code.text or ""
+        content = content.rstrip()
         if language_class := code.get("class"):
             if m := re.match("^language-(.*)$", language_class):
                 language_name = m.group(1)
@@ -960,16 +686,14 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         # translate name to standard name for (programming) language
         if language_name is not None:
+            for extension in self.extensions:
+                if extension.matches_fenced(language_name, content):
+                    return extension.transform_fenced(content)
             language_id = _LANGUAGES.get(language_name)
         else:
             language_id = None
-        content: str = code.text or ""
-        content = content.rstrip()
-        if language_id == "mermaid":
-            return self._transform_fenced_mermaid(content)
         return AC_ELEM(
             "structured-macro",
             {
@@ -984,126 +708,6 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
             AC_ELEM("plain-text-body", ET.CDATA(content)),
         )
-    def _extract_mermaid_config(self, content: str) -> MermaidConfigProperties | None:
-        """Extract scale from Mermaid YAML front matter configuration."""
-        try:
-            properties = MermaidScanner().read(content)
-            return properties.config
-        except BaseValidationError as ex:
-            LOGGER.warning("Failed to extract Mermaid properties: %s", ex)
-            return None
-    def _transform_external_mermaid(self, absolute_path: Path, attrs: ImageAttributes) -> ElementType:
-        "Emits Confluence Storage Format XHTML for a Mermaid diagram read from an external file."
-        if not absolute_path.name.endswith(".mmd") and not absolute_path.name.endswith(".mermaid"):
-            raise DocumentError("invalid image format; expected: `*.mmd` or `*.mermaid`")
-        relative_path = path_relative_to(absolute_path, self.base_dir)
-        if self.options.render_mermaid:
-            with open(absolute_path, "r", encoding="utf-8") as f:
-                content = f.read()
-            config = self._extract_mermaid_config(content)
-            image_data = mermaid.render_diagram(content, self.options.diagram_output_format, config=config)
-            # Extract dimensions and fix SVG if that's the output format
-            if self.options.diagram_output_format == "svg":
-                # Fix SVG to have explicit width/height instead of percentages
-                image_data = fix_svg_dimensions(image_data)
-                if attrs.width is None and attrs.height is None:
-                    svg_width, svg_height = get_svg_dimensions_from_bytes(image_data)
-                    if svg_width is not None or svg_height is not None:
-                        attrs = ImageAttributes(
-                            context=attrs.context,
-                            width=svg_width,
-                            height=svg_height,
-                            alt=attrs.alt,
-                            title=attrs.title,
-                            caption=attrs.caption,
-                            alignment=attrs.alignment,
-                            display_width=self.options.calculate_display_width(svg_width),
-                        )
-            image_filename = attachment_name(relative_path.with_suffix(f".{self.options.diagram_output_format}"))
-            self.embedded_files[image_filename] = EmbeddedFileData(image_data, attrs.alt)
-            return self._create_attached_image(image_filename, attrs)
-        else:
-            self.images.append(ImageData(absolute_path, attrs.alt))
-            mermaid_filename = attachment_name(relative_path)
-            return self._create_mermaid_embed(mermaid_filename)
-    def _transform_fenced_mermaid(self, content: str) -> ElementType:
-        "Emits Confluence Storage Format XHTML for a Mermaid diagram defined in a fenced code block."
-        if self.options.render_mermaid:
-            config = self._extract_mermaid_config(content)
-            image_data = mermaid.render_diagram(content, self.options.diagram_output_format, config=config)
-            # Extract dimensions and fix SVG if that's the output format
-            attrs = ImageAttributes.EMPTY_BLOCK
-            if self.options.diagram_output_format == "svg":
-                # Fix SVG to have explicit width/height instead of percentages
-                image_data = fix_svg_dimensions(image_data)
-                svg_width, svg_height = get_svg_dimensions_from_bytes(image_data)
-                if svg_width is not None or svg_height is not None:
-                    attrs = ImageAttributes(
-                        context=FormattingContext.BLOCK,
-                        width=svg_width,
-                        height=svg_height,
-                        alt=None,
-                        title=None,
-                        caption=None,
-                        alignment=ImageAlignment(self.options.alignment),
-                        display_width=self.options.calculate_display_width(svg_width),
-                    )
-            image_hash = hashlib.md5(image_data).hexdigest()
-            image_filename = attachment_name(f"embedded_{image_hash}.{self.options.diagram_output_format}")
-            self.embedded_files[image_filename] = EmbeddedFileData(image_data)
-            return self._create_attached_image(image_filename, attrs)
-        else:
-            mermaid_data = content.encode("utf-8")
-            mermaid_hash = hashlib.md5(mermaid_data).hexdigest()
-            mermaid_filename = attachment_name(f"embedded_{mermaid_hash}.mmd")
-            self.embedded_files[mermaid_filename] = EmbeddedFileData(mermaid_data)
-            return self._create_mermaid_embed(mermaid_filename)
-    def _create_mermaid_embed(self, filename: str) -> ElementType:
-        "A Mermaid diagram, linking to an attachment that captures the Mermaid source."
-        local_id = str(uuid.uuid4())
-        macro_id = str(uuid.uuid4())
-        return AC_ELEM(
-            "structured-macro",
-            {
-                AC_ATTR("name"): "mermaid-cloud",
-                AC_ATTR("schema-version"): "1",
-                "data-layout": "default",
-                AC_ATTR("local-id"): local_id,
-                AC_ATTR("macro-id"): macro_id,
-            },
-            AC_ELEM(
-                "parameter",
-                {AC_ATTR("name"): "filename"},
-                filename,
-            ),
-            AC_ELEM(
-                "parameter",
-                {AC_ATTR("name"): "toolbar"},
-                "bottom",
-            ),
-            AC_ELEM(
-                "parameter",
-                {AC_ATTR("name"): "zoom"},
-                "fit",
-            ),
-            AC_ELEM("parameter", {AC_ATTR("name"): "revision"}, "1"),
-        )
     def _transform_toc(self, code: ElementType) -> ElementType:
         "Creates a table of contents, constructed from headings in the document."
@@ -1420,7 +1024,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         image_data = render_latex(content, format=self.options.diagram_output_format)
         if self.options.diagram_output_format == "png":
-            width, height = get_png_dimensions(data=image_data)
+            width, height = extract_png_dimensions(data=image_data)
             image_data = remove_png_chunks(["pHYs"], source_data=image_data)
             attrs = ImageAttributes(
                 context,
@@ -1429,16 +1033,15 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
                 alt=content,
                 title=None,
                 caption="",
-                alignment=ImageAlignment(self.options.alignment),
-                display_width=self.options.calculate_display_width(width),
+                alignment=ImageAlignment(self.options.layout.get_image_alignment()),
             )
         else:
             attrs = ImageAttributes.empty(context)
         image_hash = hashlib.md5(image_data).hexdigest()
         image_filename = attachment_name(f"formula_{image_hash}.{self.options.diagram_output_format}")
-        self.embedded_files[image_filename] = EmbeddedFileData(image_data, content)
-        image = self._create_attached_image(image_filename, attrs)
+        self.attachments.add_embed(image_filename, EmbeddedFileData(image_data, content))
+        image = self.image_generator.create_attached_image(image_filename, attrs)
         return image
     def _transform_inline_math(self, elem: ElementType) -> ElementType:
@@ -1472,7 +1075,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
                 {AC_ATTR("name"): "body"},
                 content,
             ),
-            AC_ELEM("parameter", {AC_ATTR("name"): "align"}, self.options.alignment),
+            AC_ELEM("parameter", {AC_ATTR("name"): "align"}, self.options.layout.get_image_alignment()),
         )
         return macro
@@ -1509,7 +1112,7 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
                 {AC_ATTR("name"): "body"},
                 content,
             ),
-            AC_ELEM("parameter", {AC_ATTR("name"): "align"}, self.options.alignment),
+            AC_ELEM("parameter", {AC_ATTR("name"): "align"}, self.options.layout.get_image_alignment()),
         )
     def _transform_footnote_ref(self, elem: ElementType) -> None:
@@ -1761,162 +1364,174 @@ class ConfluenceStorageFormatConverter(NodeVisitor):
         if not isinstance(child.tag, str):
             return None
-        # <p>...</p>
-        if child.tag == "p":
-            # <p><img src="..." /></p>
-            if len(child) == 1 and not child.text and child[0].tag == "img" and not child[0].tail:
-                return self._transform_image(FormattingContext.BLOCK, child[0])
-            # <p>[[<em>TOC</em>]]</p> (represented in Markdown as `[[_TOC_]]`)
-            elif is_placeholder_for(child, "TOC"):
-                return self._transform_toc(child)
-            # <p>[[<em>LISTING</em>]]</p> (represented in Markdown as `[[_LISTING_]]`)
-            elif is_placeholder_for(child, "LISTING"):
-                return self._transform_listing(child)
-        # <div>...</div>
-        elif child.tag == "div":
-            classes = child.get("class", "").split(" ")
-            # <div class="arithmatex">...</div>
-            if "arithmatex" in classes:
-                return self._transform_block_math(child)
-            # <div><ac:structured-macro ...>...</ac:structured-macro></div>
-            elif "csf" in classes:
-                if len(child) != 1:
-                    raise DocumentError("expected: single child in Confluence Storage Format block")
-                return child[0]
-            # <div class="footnote">
-            #   <hr/>
-            #   <ol>
-            #     <li id="fn:NAME"><p>TEXT <a class="footnote-backref" href="#fnref:NAME">↩</a></p></li>
-            #   </ol>
-            # </div>
-            elif "footnote" in classes:
-                self._transform_footnote_def(child)
-                return None
-            # <div class="admonition note">
-            # <p class="admonition-title">Note</p>
+        match child.tag:
             # <p>...</p>
-            # </div>
-            #
-            # --- OR ---
-            #
-            # <div class="admonition note">
-            # <p>...</p>
-            # </div>
-            elif "admonition" in classes:
-                return self._transform_admonition(child)
-        # <blockquote>...</blockquote>
-        elif child.tag == "blockquote":
-            # Alerts in GitHub
-            # <blockquote>
-            #   <p>[!TIP] ...</p>
-            # </blockquote>
-            if len(child) > 0 and child[0].tag == "p" and child[0].text is not None and child[0].text.startswith("[!"):
-                return self._transform_github_alert(child)
-            # Alerts in GitLab
-            # <blockquote>
-            #   <p>DISCLAIMER: ...</p>
-            # </blockquote>
-            elif len(child) > 0 and child[0].tag == "p" and element_text_starts_with_any(child[0], ["FLAG:", "NOTE:", "WARNING:", "DISCLAIMER:"]):
-                return self._transform_gitlab_alert(child)
-        # <details markdown="1">
-        # <summary>...</summary>
-        # ...
-        # </details>
-        elif child.tag == "details" and len(child) > 1 and child[0].tag == "summary":
-            return self._transform_collapsed(child)
-        # <ol>...</ol>
-        elif child.tag == "ol":
-            # Confluence adds the attribute `start` for every ordered list
-            child.set("start", "1")
-            return None
+            case "p":
+                # <p><img src="..." /></p>
+                if len(child) == 1 and not child.text and child[0].tag == "img" and not child[0].tail:
+                    return self._transform_image(FormattingContext.BLOCK, child[0])
+                # <p>[[<em>TOC</em>]]</p> (represented in Markdown as `[[_TOC_]]`)
+                elif is_placeholder_for(child, "TOC"):
+                    return self._transform_toc(child)
+                # <p>[[<em>LISTING</em>]]</p> (represented in Markdown as `[[_LISTING_]]`)
+                elif is_placeholder_for(child, "LISTING"):
+                    return self._transform_listing(child)
+            # <div>...</div>
+            case "div":
+                classes = child.get("class", "").split(" ")
+                # <div class="arithmatex">...</div>
+                if "arithmatex" in classes:
+                    return self._transform_block_math(child)
+                # <div><ac:structured-macro ...>...</ac:structured-macro></div>
+                elif "csf" in classes:
+                    if len(child) != 1:
+                        raise DocumentError("expected: single child in Confluence Storage Format block")
+                    return child[0]
+                # <div class="footnote">
+                #   <hr/>
+                #   <ol>
+                #     <li id="fn:NAME"><p>TEXT <a class="footnote-backref" href="#fnref:NAME">↩</a></p></li>
+                #   </ol>
+                # </div>
+                elif "footnote" in classes:
+                    self._transform_footnote_def(child)
+                    return None
+                # <div class="admonition note">
+                # <p class="admonition-title">Note</p>
+                # <p>...</p>
+                # </div>
+                #
+                # --- OR ---
+                #
+                # <div class="admonition note">
+                # <p>...</p>
+                # </div>
+                elif "admonition" in classes:
+                    return self._transform_admonition(child)
+            # <blockquote>...</blockquote>
+            case "blockquote":
+                # Alerts in GitHub
+                # <blockquote>
+                #   <p>[!TIP] ...</p>
+                # </blockquote>
+                if len(child) > 0 and child[0].tag == "p" and child[0].text is not None and child[0].text.startswith("[!"):
+                    return self._transform_github_alert(child)
+                # Alerts in GitLab
+                # <blockquote>
+                #   <p>DISCLAIMER: ...</p>
+                # </blockquote>
+                elif len(child) > 0 and child[0].tag == "p" and element_text_starts_with_any(child[0], ["FLAG:", "NOTE:", "WARNING:", "DISCLAIMER:"]):
+                    return self._transform_gitlab_alert(child)
+            # <details markdown="1">
+            # <summary>...</summary>
+            # ...
+            # </details>
+            case "details" if len(child) > 1 and child[0].tag == "summary":
+                return self._transform_collapsed(child)
-        # <ul>
-        #   <li>[ ] ...</li>
-        #   <li>[x] ...</li>
-        # </ul>
-        elif child.tag == "ul":
-            if len(child) > 0 and all(element_text_starts_with_any(item, ["[ ]", "[x]", "[X]"]) for item in child):
-                return self._transform_tasklist(child)
+            # <ol>...</ol>
+            case "ol":
+                # Confluence adds the attribute `start` for every ordered list
+                child.set("start", "1")
+                return None
-            return None
+            # <ul>
+            #   <li>[ ] ...</li>
+            #   <li>[x] ...</li>
+            # </ul>
+            case "ul":
+                if len(child) > 0 and all(element_text_starts_with_any(item, ["[ ]", "[x]", "[X]"]) for item in child):
+                    return self._transform_tasklist(child)
-        elif child.tag == "li":
-            normalize_inline(child)
-            return None
+                return None
+            case "li":
+                normalize_inline(child)
+                return None
-        # <pre><code class="language-java"> ... </code></pre>
-        elif child.tag == "pre" and len(child) == 1 and child[0].tag == "code":
-            return self._transform_code_block(child[0])
+            # <pre><code class="language-java"> ... </code></pre>
+            case "pre" if len(child) == 1 and child[0].tag == "code":
+                return self._transform_code_block(child[0])
+            # <table>...</table>
+            case "table":
+                for td in child.iterdescendants("td", "th"):
+                    normalize_inline(td)
+                match self.options.layout.alignment:
+                    case "left":
+                        layout = "align-start"
+                    case _:
+                        layout = "default"
+                child.set("data-layout", layout)
+                if self.options.layout.table.display_mode == "fixed":
+                    child.set("data-table-display-mode", "fixed")
+                if self.options.layout.table.width:
+                    child.set("data-table-width", str(self.options.layout.table.width))
-        # <table>...</table>
-        elif child.tag == "table":
-            for td in child.iterdescendants("td", "th"):
-                normalize_inline(td)
-            child.set("data-layout", "default")
-            return None
+                return None
-        # <img src="..." alt="..." />
-        elif child.tag == "img":
-            return self._transform_image(FormattingContext.INLINE, child)
+            # <img src="..." alt="..." />
+            case "img":
+                return self._transform_image(FormattingContext.INLINE, child)
-        # <a href="..."> ... </a>
-        elif child.tag == "a":
-            return self._transform_link(child)
+            # <a href="..."> ... </a>
+            case "a":
+                return self._transform_link(child)
-        # <mark>...</mark>
-        elif child.tag == "mark":
-            return self._transform_mark(child)
+            # <mark>...</mark>
+            case "mark":
+                return self._transform_mark(child)
-        # <span>...</span>
-        elif child.tag == "span":
-            classes = child.get("class", "").split(" ")
+            # <span>...</span>
+            case "span":
+                classes = child.get("class", "").split(" ")
-            # <span class="arithmatex">...</span>
-            if "arithmatex" in classes:
-                return self._transform_inline_math(child)
+                # <span class="arithmatex">...</span>
+                if "arithmatex" in classes:
+                    return self._transform_inline_math(child)
-        # <sup id="fnref:NAME"><a class="footnote-ref" href="#fn:NAME">1</a></sup>
-        # Multiple references: <sup id="fnref2:NAME">...</sup>, <sup id="fnref3:NAME">...</sup>
-        elif child.tag == "sup" and re.match(r"^fnref\d*:", child.get("id", "")):
-            self._transform_footnote_ref(child)
-            return None
+            # <sup id="fnref:NAME"><a class="footnote-ref" href="#fn:NAME">1</a></sup>
+            # Multiple references: <sup id="fnref2:NAME">...</sup>, <sup id="fnref3:NAME">...</sup>
+            case "sup" if re.match(r"^fnref\d*:", child.get("id", "")):
+                self._transform_footnote_ref(child)
+                return None
-        # <input type="date" value="1984-01-01" />
-        elif child.tag == "input" and child.get("type", "") == "date":
-            return HTML("time", {"datetime": child.get("value", "")})
+            # <input type="date" value="1984-01-01" />
+            case "input" if child.get("type", "") == "date":
+                return HTML("time", {"datetime": child.get("value", "")})
-        # <ins>...</ins>
-        elif child.tag == "ins":
-            # Confluence prefers <u> over <ins> for underline, and replaces <ins> with <u>
-            child.tag = "u"
+            # <ins>...</ins>
+            case "ins":
+                # Confluence prefers <u> over <ins> for underline, and replaces <ins> with <u>
+                child.tag = "u"
-        # <x-emoji data-shortname="wink" data-unicode="1f609">😉</x-emoji>
-        elif child.tag == "x-emoji":
-            return self._transform_emoji(child)
+            # <x-emoji data-shortname="wink" data-unicode="1f609">😉</x-emoji>
+            case "x-emoji":
+                return self._transform_emoji(child)
-        # <h1>...</h1>
-        # <h2>...</h2> ...
-        m = re.match(r"^h([1-6])$", child.tag, flags=re.IGNORECASE)
-        if m is not None:
-            level = int(m.group(1))
-            title = element_to_text(child)
-            self.toc.add(level, title)
+            # <h1>...</h1>
+            # <h2>...</h2> ...
+            case "h1" | "h2" | "h3" | "h4" | "h5" | "h6":
+                level = int(child.tag[1:])
+                title = element_to_text(child)
+                self.toc.add(level, title)
-            if self.options.heading_anchors:
-                self._transform_heading(child)
-                return None
+                if self.options.heading_anchors:
+                    self._transform_heading(child)
+                    return None
+            case _:
+                pass
         return None
@@ -1940,14 +1555,14 @@ class ConfluenceDocument:
     images: list[ImageData]
     embedded_files: dict[str, EmbeddedFileData]
-    options: ConfluenceDocumentOptions
+    options: DocumentOptions
     root: ElementType
     @classmethod
     def create(
         cls,
         path: Path,
-        options: ConfluenceDocumentOptions,
+        options: DocumentOptions,
         root_dir: Path,
         site_metadata: ConfluenceSiteMetadata,
         page_metadata: ConfluencePageCollection,
@@ -1955,9 +1570,10 @@ class ConfluenceDocument:
         path = path.resolve(True)
         document = Scanner().read(path)
+        props = document.properties
-        if document.page_id is not None:
-            page_id = ConfluencePageID(document.page_id)
+        if props.page_id is not None:
+            page_id = ConfluencePageID(props.page_id)
         else:
             # look up Confluence page ID in metadata
             metadata = page_metadata.get(path)
@@ -1972,13 +1588,14 @@ class ConfluenceDocument:
         self,
         path: Path,
         document: ScannedDocument,
-        options: ConfluenceDocumentOptions,
+        options: DocumentOptions,
         root_dir: Path,
         site_metadata: ConfluenceSiteMetadata,
         page_metadata: ConfluencePageCollection,
     ) -> None:
         "Converts a single Markdown document to Confluence Storage Format."
+        props = document.properties
         self.options = options
         # register auxiliary URL substitutions
@@ -1992,7 +1609,7 @@ class ConfluenceDocument:
         # modify HTML as necessary
         if self.options.generated_by is not None:
-            generated_by = document.generated_by or self.options.generated_by
+            generated_by = props.generated_by or self.options.generated_by
         else:
             generated_by = None
@@ -2016,11 +1633,9 @@ class ConfluenceDocument:
             raise ConversionError(path) from ex
         # configure HTML-to-Confluence converter
-        converter_options = ConfluenceConverterOptions(
-            **{field.name: getattr(self.options, field.name) for field in dataclasses.fields(ConfluenceConverterOptions)}
-        )
-        if document.alignment is not None:
-            converter_options.alignment = document.alignment
+        converter_options = copy.deepcopy(self.options.converter)
+        if props.layout is not None:
+            converter_options.layout = coalesce(props.layout, converter_options.layout)
         converter = ConfluenceStorageFormatConverter(converter_options, path, root_dir, site_metadata, page_metadata)
         # execute HTML-to-Confluence converter
@@ -2031,19 +1646,19 @@ class ConfluenceDocument:
         # extract information discovered by converter
         self.links = converter.links
-        self.images = converter.images
-        self.embedded_files = converter.embedded_files
+        self.images = converter.attachments.images
+        self.embedded_files = converter.attachments.embedded_files
         # assign global properties for document
-        self.title = document.title or converter.toc.get_title()
-        self.labels = document.tags
-        self.properties = document.properties
+        self.title = props.title or converter.toc.get_title()
+        self.labels = props.tags
+        self.properties = props.properties
         # Remove the first heading if:
         # 1. The option is enabled
         # 2. Title was NOT from front-matter (props.title is None)
         # 3. A title was successfully extracted from heading (self.title is not None)
-        if converter_options.skip_title_heading and document.title is None and self.title is not None:
+        if converter_options.skip_title_heading and props.title is None and self.title is not None:
             self._remove_first_heading()
     def _remove_first_heading(self) -> None:
@@ -2094,35 +1709,3 @@ class ConfluenceDocument:
     def xhtml(self) -> str:
         return elements_to_string(self.root)
-def attachment_name(ref: Path | str) -> str:
-    """
-    Safe name for use with attachment uploads.
-    Mutates a relative path such that it meets Confluence's attachment naming requirements.
-    Allowed characters:
-    * Alphanumeric characters: 0-9, a-z, A-Z
-    * Special characters: hyphen (-), underscore (_), period (.)
-    """
-    if isinstance(ref, Path):
-        path = ref
-    else:
-        path = Path(ref)
-    if path.drive or path.root:
-        raise ValueError(f"required: relative path; got: {ref}")
-    regexp = re.compile(r"[^\-0-9A-Za-z_.]", re.UNICODE)
-    def replace_part(part: str) -> str:
-        if part == "..":
-            return "PAR"
-        else:
-            return regexp.sub("_", part)
-    parts = [replace_part(p) for p in path.parts]
-    return Path(*parts).as_posix().replace("/", "_")

markdown-to-confluence 0.5.2__py3-none-any.whl → 0.5.3__py3-none-any.whl

markdown-to-confluence 0.5.2py3-none-any.whl → 0.5.3py3-none-any.whl