PyPI - chatgpt-md-converter - Versions diffs - 0.3.9__tar.gz → 0.3.11__tar.gz - Mend

chatgpt-md-converter 0.3.9.tar.gz → 0.3.11.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: chatgpt_md_converter
-Version: 0.3.9
+Version: 0.3.11
 Summary: A package for converting markdown to HTML for chat Telegram bots
 Home-page: https://github.com/botfather-dev/formatter-chatgpt-telegram
 Author: Kostiantyn Kriuchkov

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/chatgpt_md_converter/html_markdown/handlers.py RENAMED Viewed

@@ -35,30 +35,91 @@ def render_node(node: Node, state: RenderState) -> str:
     return render_nodes(node.children, state)
+def _split_surrounding_whitespace(text: str) -> tuple[str, str, str]:
+    """Return leading whitespace, core text, and trailing whitespace."""
+    start = 0
+    end = len(text)
+    while start < end and text[start].isspace():
+        start += 1
+    while end > start and text[end - 1].isspace():
+        end -= 1
+    return text[:start], text[start:end], text[end:]
+def _italic_boundary_conflict(marker: str, core: str) -> bool:
+    if marker == "*":
+        return core.startswith("*") or core.endswith("*")
+    if marker == "_":
+        starts = core.startswith("_")
+        if starts and len(core) > 1 and core[1] == "_":
+            starts = False
+        ends = core.endswith("_")
+        if ends and len(core) > 1 and core[-2] == "_":
+            ends = False
+        return starts or ends
+    return False
+def _choose_italic_marker(state: RenderState, core: str) -> str:
+    depth = state.italic_depth
+    if state.bold_depth > 0 and depth == 0:
+        candidates = ["_", "*"]
+    elif depth % 2 == 0:
+        candidates = ["*", "_"]
+    else:
+        candidates = ["_", "*"]
+    for marker in candidates:
+        if not _italic_boundary_conflict(marker, core):
+            return marker
+    return candidates[0]
 def _handle_bold(node: Node, state: RenderState) -> str:
     inner_state = state.child(bold_depth=state.bold_depth + 1)
     inner = render_nodes(node.children, inner_state)
-    return f"**{inner}**"
+    leading, core, trailing = _split_surrounding_whitespace(inner)
+    if not core:
+        return leading + trailing
+    return f"{leading}**{core}**{trailing}"
 def _handle_italic(node: Node, state: RenderState) -> str:
     depth = state.italic_depth
-    in_bold = state.bold_depth > 0 and depth == 0
-    marker = "_" if in_bold else ("*" if depth % 2 == 0 else "_")
     inner_state = state.child(italic_depth=depth + 1)
     inner = render_nodes(node.children, inner_state)
-    return f"{marker}{inner}{marker}"
+    leading, core, trailing = _split_surrounding_whitespace(inner)
+    if not core:
+        return leading + trailing
+    marker = _choose_italic_marker(state, core)
+    return f"{leading}{marker}{core}{marker}{trailing}"
 def _handle_inline_marker(node: Node, state: RenderState) -> str:
     marker_open, marker_close = _INLINE_MARKERS[node.tag.lower()]
     inner = render_nodes(node.children, state)
-    return f"{marker_open}{inner}{marker_close}"
+    leading, core, trailing = _split_surrounding_whitespace(inner)
+    if not core:
+        return leading + trailing
+    return f"{leading}{marker_open}{core}{marker_close}{trailing}"
 def _handle_spoiler(node: Node, state: RenderState) -> str:
     inner = render_nodes(node.children, state)
-    return f"||{inner}||"
+    leading, core, trailing = _split_surrounding_whitespace(inner)
+    if not core:
+        return leading + trailing
+    return f"{leading}||{core}||{trailing}"
 def _handle_code(node: Node, state: RenderState) -> str:

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/chatgpt_md_converter/telegram_markdown/code_blocks.py RENAMED Viewed

@@ -67,7 +67,7 @@ def extract_and_convert_code_blocks(text: str):
             .replace("<", "&lt;")
             .replace(">", "&gt;")
         )
-        placeholder = f"CODEBLOCKPLACEHOLDER{len(placeholders)}"
+        placeholder = f"CODEBLOCKPLACEHOLDER_{len(placeholders)}_"
         placeholders.append(placeholder)
         if language:
             html_block = f'<pre><code class="language-{language}">{escaped}</code></pre>'

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/chatgpt_md_converter/telegram_markdown/inline.py RENAMED Viewed

@@ -60,7 +60,7 @@ def extract_inline_code_snippets(text: str):
     def replacer(match: re.Match[str]) -> str:
         snippet = match.group(1)
-        placeholder = f"INLINECODEPLACEHOLDER{len(placeholders)}"
+        placeholder = f"INLINECODEPLACEHOLDER_{len(placeholders)}_"
         placeholders.append(placeholder)
         snippets[placeholder] = snippet
         return placeholder

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/chatgpt_md_converter.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: chatgpt_md_converter
-Version: 0.3.9
+Version: 0.3.11
 Summary: A package for converting markdown to HTML for chat Telegram bots
 Home-page: https://github.com/botfather-dev/formatter-chatgpt-telegram
 Author: Kostiantyn Kriuchkov

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/chatgpt_md_converter.egg-info/SOURCES.txt RENAMED Viewed

@@ -20,6 +20,7 @@ chatgpt_md_converter/telegram_markdown/inline.py
 chatgpt_md_converter/telegram_markdown/postprocess.py
 chatgpt_md_converter/telegram_markdown/preprocess.py
 chatgpt_md_converter/telegram_markdown/renderer.py
+tests/test_html_to_markdown_inline_spacing.py
 tests/test_parser.py
 tests/test_roundtrip_markdown.py
 tests/test_splitter.py

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/setup.py RENAMED Viewed

@@ -2,7 +2,7 @@ from setuptools import setup
 setup(
     name="chatgpt_md_converter",
-    version="0.3.9",
+    version="0.3.11",
     author="Kostiantyn Kriuchkov",
     author_email="latand666@gmail.com",
     description="A package for converting markdown to HTML for chat Telegram bots",

chatgpt_md_converter-0.3.11/tests/test_html_to_markdown_inline_spacing.py ADDED Viewed

@@ -0,0 +1,25 @@
+import pytest
+from chatgpt_md_converter import html_to_telegram_markdown
+@pytest.mark.parametrize(
+    ("html", "expected"),
+    [
+        ("Start <b>bold </b>finish", "Start **bold** finish"),
+        ("Start <b> bold</b> finish", "Start  **bold** finish"),
+        ("Start <i> italics </i>finish", "Start  _italics_ finish"),
+        ("Start <i>value_</i>end", "Start *value_*end"),
+        ("Start <u> underline </u>finish", "Start  __underline__ finish"),
+        (
+            "Start <span class=\"tg-spoiler\"> secret </span>end",
+            "Start  ||secret|| end",
+        ),
+        (
+            "Intro <b>bold <i> inner </i> block</b> outro",
+            "Intro **bold  _inner_  block** outro",
+        ),
+    ],
+)
+def test_html_to_markdown_strips_inline_whitespace(html: str, expected: str) -> None:
+    assert html_to_telegram_markdown(html) == expected

{chatgpt_md_converter-0.3.9 → chatgpt_md_converter-0.3.11}/tests/test_parser.py RENAMED Viewed

@@ -800,6 +800,66 @@ print("hello world ```")
     assert output == expected_output, show_output()
+def test_inline_code_placeholders_do_not_overlap():
+    input_text = """Службова нотатка для тесту.
+Коли ви запускаєте `alpha.run()`, система піднімає локальний клієнт.
+У модулі використовується `hook.set()` для реєстрації синхронізації.
+```python
+from framework import hook
+async def configure(base_url: str):
+    await hook.set(f"{base_url}/sync")
+```
+**Покроковий план**
+1.  Викликаємо `hook.set()` через менеджер потоків.
+2.  `hook.set()` повертає попередження при повторній реєстрації.
+3.  Якщо потрібно, `hook.clear()` знімає прив'язку.
+4.  Використовуємо `core.loop()` для довготривалих з'єднань.
+5.  `hook.set()` запускає фонову синхронізацію.
+Поточне середовище потребує **TLS**. Для локального доступу підходить `debug.tunnel`.
+Чи є питання щодо `hook.set()` чи `hook.clear()`?"""
+    expected_output = """Службова нотатка для тесту.
+Коли ви запускаєте <code>alpha.run()</code>, система піднімає локальний клієнт.
+У модулі використовується <code>hook.set()</code> для реєстрації синхронізації.
+<pre><code class="language-python">from framework import hook
+async def configure(base_url: str):
+    await hook.set(f"{base_url}/sync")
+</code></pre>
+<b>Покроковий план</b>
+1.  Викликаємо <code>hook.set()</code> через менеджер потоків.
+2.  <code>hook.set()</code> повертає попередження при повторній реєстрації.
+3.  Якщо потрібно, <code>hook.clear()</code> знімає прив'язку.
+4.  Використовуємо <code>core.loop()</code> для довготривалих з'єднань.
+5.  <code>hook.set()</code> запускає фонову синхронізацію.
+Поточне середовище потребує <b>TLS</b>. Для локального доступу підходить <code>debug.tunnel</code>.
+Чи є питання щодо <code>hook.set()</code> чи <code>hook.clear()</code>?"""
+    output = telegram_format(input_text)
+    assert output == expected_output
+    assert "<code>hook.set()</code>0" not in output
+    assert "<code>hook.set()</code>1" not in output
+    assert "<code>hook.set()</code>2" not in output
+    assert "<code>hook.set()</code>3" not in output
+    assert "<code>hook.set()</code>4" not in output
 def test_nested_code_fence_six_backticks():
     input_text = """``````markdown
 `````python