PyPI - markdown_convert - Versions diffs - 1.2.51__py3-none-any.whl → 1.2.52__py3-none-any.whl - Mend

markdown_convert 1.2.51__py3-none-any.whl → 1.2.52__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

markdown_convert/default.css CHANGED Viewed

@@ -453,14 +453,6 @@ math {
   border-radius: 0.3rem;
 }
-.admonition header {
-  display: flex;
-  align-items: center;
-  gap: 0.25rem;
-  margin-bottom: 0.25rem;
-  font-weight: bold;
-}
 .admonition strong {
   text-transform: capitalize;
 }
@@ -522,4 +514,14 @@ math {
 .admonition.caution strong {
   color: var(--color-ad-caution);
+}
+/* Vega-Lite charts*/
+.vega-lite {
+  display: flex;
+  justify-content: center;
+  align-items: center;
+  width: 100%;
+  margin-top: 1em;
+  margin-bottom: 1em;
 }

markdown_convert/modules/extras.py CHANGED Viewed

@@ -3,98 +3,221 @@ Extras are defined as helper functions called by
 render_extra_features from transform.py
 """
+import vl_convert as vlc
+from ruamel.yaml import YAML
+from bs4 import Tag, BeautifulSoup
+import re
-def create_checkbox(soup, match):
+class ExtraFeature:
     """
-    Render a tag for a checkbox.
+    Base class for extra features that can be applied to HTML.
-    Args:
-        soup: HTML beautifulsoup
-        match: Element identified as a checkbox
-    Returns:
-        tag: Beautifulsoup tag representing the checkbox
+    Attributes:
+        pattern (str): Regex pattern to match the extra feature in the HTML.
+        run_before_stash (bool): Whether to run this extra before stashing code blocks.
     """
-    tag = soup.new_tag("input", type="checkbox")
-    if "[x]" in match.group("checkbox"):
-        tag["checked"] = ""
-    return tag
+    pattern = r""
+    run_before_stash = False
-def create_highlight(soup, match):
-    """
-    Render a tag for a highlight.
+    def replace(self, match, html):
+        """
+        Replaces the matched pattern with the rendered extra feature.
-    Args:
-        soup: HTML beautifulsoup
-        match: Element identified as a highlight
-    Returns:
-        tag: Beautifulsoup tag representing the highlight
+        Args:
+            match (re.Match): The regex match object.
+            html (str): The full HTML content.
+        Returns:
+            str: The replacement string.
+        Raises:
+            NotImplementedError: If the subclass does not implement this method.
+        """
+        raise NotImplementedError("Subclasses must implement the replace method.")
+class CheckboxExtra(ExtraFeature):
+    """
+    Extra feature for rendering checkboxes.
     """
-    tag = soup.new_tag("span", attrs={"class": "highlight"})
-    tag.string = match.group("hl_content")
-    return tag
+    pattern = r"(?P<checkbox>\[\s\]|\[x\])"
+    def replace(match, html):
+        """
+        Render a tag for a checkbox.
+        Args:
+            match: Element identified as a checkbox
+        Returns:
+            str: tag representing the checkbox
+        """
+        status = "checked" if "[x]" in match.group("checkbox") else ""
+        return f'<input type="checkbox" {status}>'
-def create_custom_span(soup, match):
+class HighlightExtra(ExtraFeature):
+    """
+    Extra feature for rendering highlighted text.
     """
-    Render a tag for a custom span.
-    Args:
-        soup: HTML beautifulsoup
-        match: Element identified as a custom span
-    Returns:
-        tag: Beautifulsoup tag representing the custom span
+    pattern = r"==(?P<content>.*?)=="
+    def replace(match, html):
+        """
+        Render a tag for a highlight.
+        Args:
+            match: Element identified as a highlight
+        Returns:
+            str: tag representing the highlight
+        """
+        content = match.group("content")
+        return f'<span class="highlight">{content}</span>'
+class CustomSpanExtra(ExtraFeature):
     """
-    tag = soup.new_tag("span", attrs={"class": match.group("cls")})
-    tag.string = match.group("sp_content")
-    return tag
+    Extra feature for rendering custom spans with specific classes.
+    """
+    pattern = r"(?P<cls>[a-zA-Z0-9_-]+)\{\{\s*(?P<content>.*?)\s*\}\}"
+    def replace(match, html):
+        """
+        Render a tag for a custom span.
-def create_toc(soup, match):
+        Args:
+            match: Element identified as a custom span
+        Returns:
+            str: tag representing the custom span
+        """
+        cls = match.group("cls")
+        content = match.group("content")
+        return f'<span class="{cls}">{content}</span>'
+class TocExtra(ExtraFeature):
+    """
+    Extra feature for rendering a Table of Contents.
     """
-    Render a tag for a table of contents
+    pattern = r"\[TOC(?:\s+depth=(?P<depth>\d+))?\]"
+    def replace(match, html):
+        """
+        Render a tag for a table of contents
+        Args:
+            match: Element identified as a table of contents
+        Returns:
+            str: tag representing the table of contents
+        """
+        soup = BeautifulSoup(html, "html.parser")
+        max_level = match.group("depth")
+        max_level = 3 if max_level is None else int(max_level)
+        headers = [
+            header
+            for header in soup.find_all(
+                [f"h{index}" for index in range(1, max_level + 1)]
+            )
+            if header.get("id")
+        ]
+        if not headers:
+            return ""
+        tag: Tag = soup.new_tag("ul", attrs={"class": "toc"})
+        active_list = {0: tag}
+        last_list_element = {}
+        for header in headers:
+            level = int(header.name[1])
+            if level not in active_list:
+                parent_lvl = max(key for key in active_list if key < level)
+                if last_list_element.get(parent_lvl):
+                    sub_list = soup.new_tag("ul")
+                    last_list_element[parent_lvl].append(sub_list)
+                    active_list[level] = sub_list
+                else:
+                    active_list[level] = active_list[parent_lvl]
+            active_list = {
+                key: value for key, value in active_list.items() if key <= level
+            }
+            list_item = soup.new_tag("li")
+            link = soup.new_tag("a", href=f"#{header['id']}")
+            link.string = header.get_text(strip=True)
+            list_item.append(link)
+            active_list[level].append(list_item)
+            last_list_element[level] = list_item
+        return tag.prettify()
+class VegaExtra(ExtraFeature):
+    """
+    Extra feature for rendering Vega-Lite diagrams from YAML.
+    """
+    pattern = r"(?s)<pre><code>\$schema: https://vega\.github\.io(?P<content>.*?)</code></pre>"
+    run_before_stash = True
+    def replace(match, html):
+        """
+        Render a tag for a vega lite diagram YAML.
+        Args:
+            match (re.Match): Element identified as a vega lite diagram YAML.
+            html (str): The full HTML content.
+        Returns:
+            str: SVG tag representing the vega lite diagram.
+        """
+        schema_line = "$schema: https://vega.github.io"
+        yaml = YAML()
+        spec = yaml.load(schema_line + match.group("content"))
+        tag = vlc.vegalite_to_svg(spec)
+        return f"<div class='vega-lite'>{tag}</div>"
+def apply_extras(extras: set[ExtraFeature], html, before_stash=False):
+    """
+    Applies extra features to an html string.
     Args:
-        soup: HTML beautifulsoup
-        match: Element identified as a table of contents
+        extras: set[ExtraFeature] Extra features to apply
+        html: complete html text, used by some extras like TOC.
     Returns:
-        tag: Beautifulsoup tag representing the table of contents
+        str: The updated html.
     """
-    max_level = match.group("depth")
-    max_level = 3 if max_level is None else int(max_level)
-    headers = [
-        header
-        for header in soup.find_all([f"h{index}" for index in range(1, max_level + 1)])
-        if header.get("id")
-    ]
-    if not headers:
-        return ""
-    tag = soup.new_tag("ul", attrs={"class": "toc"})
-    active_list = {0: tag}
-    last_list_element = {}
-    for header in headers:
-        level = int(header.name[1])
-        if level not in active_list:
-            parent_lvl = max(key for key in active_list if key < level)
-            if last_list_element.get(parent_lvl):
-                sub_list = soup.new_tag("ul")
-                last_list_element[parent_lvl].append(sub_list)
-                active_list[level] = sub_list
-            else:
-                active_list[level] = active_list[parent_lvl]
-        active_list = {key: value for key, value in active_list.items() if key <= level}
-        list_item = soup.new_tag("li")
-        link = soup.new_tag("a", href=f"#{header['id']}")
-        link.string = header.get_text(strip=True)
-        list_item.append(link)
-        active_list[level].append(list_item)
-        last_list_element[level] = list_item
-    return tag
+    for extra in extras:
+        if not extra.run_before_stash == before_stash:
+            continue
+        # Loop until the pattern no longer matches
+        while re.search(extra.pattern, html, flags=re.DOTALL):
+            new_html = html
+            try:
+                new_html = re.sub(
+                    extra.pattern,
+                    lambda match: extra.replace(match, html=html),
+                    html,
+                    flags=re.DOTALL,
+                )
+            except Exception as exc:
+                print(
+                    f"WARNING: An exception occurred while trying to apply an extra:\n{exc}"
+                )
+                pass
+            # Safety break:
+            if new_html == html:
+                break
+            html = new_html
+    return html

markdown_convert/modules/transform.py CHANGED Viewed

@@ -6,9 +6,15 @@ import re
 from bs4 import BeautifulSoup
-from .constants import YELLOW
-from .extras import create_checkbox, create_custom_span, create_highlight, create_toc
-from .utils import color
+from .extras import (
+    apply_extras,
+    ExtraFeature,
+    CheckboxExtra,
+    CustomSpanExtra,
+    HighlightExtra,
+    TocExtra,
+    VegaExtra,
+)
 def create_html_document(html_content, css_content, csp):
@@ -89,76 +95,41 @@ def render_mermaid_diagrams(html, *, nonce):
     return html
-def render_extra_features(html):
+def render_extra_features(
+    html,
+    extras: set[ExtraFeature] = (
+        CheckboxExtra,
+        CustomSpanExtra,
+        HighlightExtra,
+        TocExtra,
+        VegaExtra,
+    ),
+):
     """
-    Renders extra features like checkboxes, highlights, and custom spans in the HTML content.
-    Args:
-        html (str): HTML content.
-    Returns:
-        str: HTML content with extra features rendered.
+    Renders extra features by protecting specific tags, applying regex
+    transformations, and restoring the protected content.
     """
+    placeholders = {}
+    def stash(match):
+        key = f"__PROTECTED_BLOCK_{len(placeholders)}__"
+        placeholders[key] = match.group(0)
+        return key
-    handlers = {
-        "checkbox": create_checkbox,
-        "highlight": create_highlight,
-        "span": create_custom_span,
-        "toc": create_toc,
-    }
-    master_pattern = re.compile(
-        r"(?P<checkbox>\[\s\]|\[x\])|"
-        r"(?P<highlight>==(?P<hl_content>.*?)==)|"
-        r"(?P<span>(?P<cls>[a-zA-Z0-9_-]+)\{\{\s*(?P<sp_content>.*?)\s*\}\})|"
-        r"(?P<toc>\[TOC(?:\s+depth=(?P<depth>\d+))?\])"
+    # 0. Pre protection extras
+    html = apply_extras(extras, html, before_stash=True)
+    # 1. Protection: Replace ignored tags with unique hashes
+    ignored_pattern = re.compile(
+        r"<(code|pre|script|style)\b[^>]*>.*?</\1>", re.DOTALL | re.IGNORECASE
     )
+    html = ignored_pattern.sub(stash, html)
-    ignored_tags = {"code", "pre", "script", "style"}
-    soup = BeautifulSoup(html, "html.parser")
-    for text_node in soup.find_all(string=True):
-        # Ignore text nodes within certain tags
-        if text_node.parent.name in ignored_tags:
-            continue
-        # If no match, skip processing
-        content = text_node.string
-        if not master_pattern.search(content):
-            continue
-        new_nodes = []
-        last_end = 0
-        for match in master_pattern.finditer(content):
-            start, end = match.span()
-            # Append text before the match
-            if start > last_end:
-                new_nodes.append(content[last_end:start])
-            kind = match.lastgroup
-            # Call the appropriate handler
-            handler = handlers.get(kind)
-            if handler:
-                try:
-                    tag = handler(soup, match)
-                    new_nodes.append(tag)
-                except Exception as exc:
-                    print(
-                        color(
-                            YELLOW,
-                            f"WARNING: Handler for '{kind}' failed with exception: {exc}",
-                        )
-                    )
-                    new_nodes.append(match.group(0))
-            last_end = end
-        # Append any remaining text after the last match
-        if new_nodes:
-            if last_end < len(content):
-                new_nodes.append(content[last_end:])
-            text_node.replace_with(*new_nodes)
+    # 2. Transformations: Define patterns and their replacements
+    html = apply_extras(extras, html, before_stash=False)
-    return str(soup)
+    # 3. Restoration: Replace hashes back with original content
+    for key, original_content in placeholders.items():
+        html = html.replace(key, original_content)
+    return html

{markdown_convert-1.2.51.dist-info → markdown_convert-1.2.52.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: markdown_convert
-Version: 1.2.51
+Version: 1.2.52
 Summary: Convert Markdown files to PDF from your command line.
 Project-URL: homepage, https://github.com/Julynx/markdown_convert
 Author-email: Julio Cabria <juliocabria@tutanota.com>
@@ -17,6 +17,8 @@ Requires-Dist: latex2mathml>=3.78.1
 Requires-Dist: markdown2<3,>=2.4.13
 Requires-Dist: playwright>=1.57.0
 Requires-Dist: pygments<3,>=2.17.2
+Requires-Dist: ruamel-yaml>=0.19.1
+Requires-Dist: vl-convert-python>=1.9.0.post1
 Description-Content-Type: text/markdown
 # markdown-convert

{markdown_convert-1.2.51.dist-info → markdown_convert-1.2.52.dist-info}/RECORD RENAMED Viewed

@@ -1,18 +1,18 @@
 markdown_convert/__init__.py,sha256=0hLMtJnCIuApqopx5P4tiDSw850AmnuVcohmAbPVEZ4,303
 markdown_convert/__main__.py,sha256=AocRo1iF1El_-Uo0owJ-QLbJUF0rum5R_AlNrTTTSOQ,2780
 markdown_convert/code.css,sha256=Wt4FqFqJcpT-jwY3GN-o4ZRCCXU8DQj-9lqKdGiuoyw,4935
-markdown_convert/default.css,sha256=XmIR6Kx4evwmLTZr9QZc3XhDj4jxjmGkwaeftfvHNmU,8149
+markdown_convert/default.css,sha256=2Aac379NfFgytk8Gwnh4kNFN3FMNYmpxxNvoATg1How,8183
 markdown_convert/modules/__init__.py,sha256=PFPgiQhMXgyfjD8BkfLC_X8AR1jz-dCxfif2qmNofJs,65
 markdown_convert/modules/autoinstall.py,sha256=Tnrde6MIcO11PWT7GZwhs_QTVRy6CSpUB_gIi9G5ve8,2063
 markdown_convert/modules/constants.py,sha256=FA8DrQa9nzTUIJFXwXrK-AuOc5_ToGSFaD4sJqsnAjU,1305
 markdown_convert/modules/convert.py,sha256=1AjQfnOXJoxKyfqr4misDuTvE4YXnwaoWw668FUHiEQ,8972
-markdown_convert/modules/extras.py,sha256=GwNx6nseztHOWExcYmovxomdvOs078dMeknQTwzTCJo,2730
+markdown_convert/modules/extras.py,sha256=GO-Nk5hCWsdcPggL2-Mv9Q31wFWLLWyNK_xhXUEOs9g,6313
 markdown_convert/modules/resources.py,sha256=eskLLbrkLJWs-vqtCLq4qV2Hjy6XeGFCUdT0VN2b_tA,2488
-markdown_convert/modules/transform.py,sha256=e4QllWx5BYKEQqIzOkYigtxcSAWqSUHsoKkvqzYzEpY,4567
+markdown_convert/modules/transform.py,sha256=9_0mqeHwKPECr3Ft1z8r14flTOw4Y8dxblsOIfblEGw,3476
 markdown_convert/modules/utils.py,sha256=NX0WegM8e8MPKNNmweTujAWO8ZghdB8LSGDx20K2E44,655
 markdown_convert/modules/validate.py,sha256=XV_k7cHeifEKDaltF26tCmabs2-Me5msP3enI_eVwfA,1517
-markdown_convert-1.2.51.dist-info/METADATA,sha256=sejp1Y3EzxGpfMqDxIJsieDaxkO9_o0gFffs7ULpwKw,4118
-markdown_convert-1.2.51.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
-markdown_convert-1.2.51.dist-info/entry_points.txt,sha256=RCmzC7C0sX-SpzIP2Cr34rhg3lMd7BRx-exaZPfK8bU,68
-markdown_convert-1.2.51.dist-info/licenses/LICENSE,sha256=gXf5dRMhNSbfLPYYTY_5hsZ1r7UU1OaKQEAQUhuIBkM,18092
-markdown_convert-1.2.51.dist-info/RECORD,,
+markdown_convert-1.2.52.dist-info/METADATA,sha256=d7J5oijwQL3Z23RLFgxGMMFh_-jjVIsP2evst7LqK5w,4199
+markdown_convert-1.2.52.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
+markdown_convert-1.2.52.dist-info/entry_points.txt,sha256=RCmzC7C0sX-SpzIP2Cr34rhg3lMd7BRx-exaZPfK8bU,68
+markdown_convert-1.2.52.dist-info/licenses/LICENSE,sha256=gXf5dRMhNSbfLPYYTY_5hsZ1r7UU1OaKQEAQUhuIBkM,18092
+markdown_convert-1.2.52.dist-info/RECORD,,

{markdown_convert-1.2.51.dist-info → markdown_convert-1.2.52.dist-info}/WHEEL RENAMED Viewed

File without changes

{markdown_convert-1.2.51.dist-info → markdown_convert-1.2.52.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{markdown_convert-1.2.51.dist-info → markdown_convert-1.2.52.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

markdown_convert 1.2.51__py3-none-any.whl → 1.2.52__py3-none-any.whl

markdown_convert 1.2.51__py3-none-any.whl → 1.2.52__py3-none-any.whl