PyPI - markdowndata - Versions diffs - 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl - Mend

markdowndata 0.0.5py3-none-any.whl → 0.1.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

markdowndata/__init__.py CHANGED Viewed

@@ -7,4 +7,4 @@ def loads(text):
 def load(file):
-    return loads(file.read())
+    return loads(file.read())

markdowndata/content_parser.py CHANGED Viewed

@@ -32,17 +32,12 @@ def detect_value_type(text: str) -> str | None:
     return 'md_text'
-def yaml_dict_parser(text: str) -> dict:
+def yaml_parser(text: str) -> dict:
     """
-    Parse YAML from a string (surrounded by ===) and returns it as a dictionary.
-    Assumes YAML is a block at the beginning of the text.
+    Parse YAML from a string (surrounded by ===)
     """
     match = re.search(r'===\s*\n(.*?)\n===', text, re.DOTALL)
-    if match:
-        yaml_data = yaml.safe_load(match.group(1))
-        if yaml_data:
-            return {k: convert_value(v) for k, v in yaml_data.items()}
-    return {}
+    return yaml.safe_load(match.group(1))
 def md_table_parser(text: str) -> list[dict]:
@@ -167,7 +162,7 @@ def parse_content_block(text: str):
         raise ValueError(f'No parser found for content: {text}')
     parser_functions = {
-        'yaml_dict': yaml_dict_parser,
+        'yaml_dict': yaml_parser,
         'md_table': md_table_parser,
         'md_list': md_list_parser,
         'md_text': md_text_parser

markdowndata/process_markdown.py CHANGED Viewed

@@ -1,4 +1,5 @@
 from typing import List
 from .content_parser import parse_content_block
 from .section_tree import split_sections, build_section_tree
 from .utils import Node
@@ -9,6 +10,7 @@ class MarkDataParser:
     Parses a Markdown document into a JSON-like dictionary structure.
     Builds a hierarchy of sections and converts each section's content into a structured form.
     """
     def __init__(self):
         self.data = {}
@@ -29,7 +31,7 @@ class MarkDataParser:
         # Convert the section tree into a JSON-like dictionary structure
         self.data = self.build_dict(section_tree)
-        return self.data
+        return self.data['Root']
     def build_dict(self, sections: List[Node]) -> dict:
         """
@@ -39,12 +41,8 @@ class MarkDataParser:
         for node in sections:
             sub_dict = self.build_dict(node.subsections)
-            if isinstance(node.parsed, dict):
-                # If the parsed content is a dictionary, merge it with its subsections
-                merged = {**node.parsed, **sub_dict}
-            elif node.subsections:
-                # If subsections exist but parsed content is not a dict,
-                # wrap both into a new dictionary
+            if node.subsections:
+                # If subsections exist, wrap the parsed content and the subsections into a new dictionary
                 merged = {
                     'content': node.parsed,
                     **sub_dict
@@ -55,4 +53,5 @@ class MarkDataParser:
             # Use the node's title as the key in the dictionary
             result[node.title] = merged
         return result

markdowndata/section_tree.py CHANGED Viewed

@@ -12,6 +12,17 @@ def split_sections(text: str):
     matches = list(pattern.finditer(text))
     sections = []
+    # First grab anything before the initial header
+    end = matches[0].start() if matches else len(text)
+    sections.append(Section(
+        title="",  # The section's title text
+        level=0,  # The number of # symbols indicates nesting level
+        start=0,  # Position where this header starts in the text
+        end=end,  # Position where this section's content ends
+        content=text[:end].strip()  # The actual text content of this section (excluding header)
+    ))
     for i, match in enumerate(matches):
         # Calculate the 'end' of the current section:
         # It's the start of the next header or the end of the document.
@@ -34,6 +45,12 @@ def build_section_tree(sections):
     Uses a stack to track the current section hierarchy.
     """
     root = Node(title='Root', level=0, parsed={}, subsections=[])
+    # If the initial section is level 0, its content belongs to the root
+    if sections[0].level == 0:
+        root.parsed = parse_content_block(sections[0].content)
+        sections.pop(0)
     stack = [root]
     for section in sections:
@@ -55,4 +72,4 @@ def build_section_tree(sections):
         # Push this node to the stack (might have its own children)
         stack.append(node)
-    return root.subsections
+    return [root]

{markdowndata-0.0.5.dist-info → markdowndata-0.1.0.dist-info}/METADATA RENAMED Viewed

@@ -1,8 +1,9 @@
-Metadata-Version: 2.3
+Metadata-Version: 2.4
 Name: markdowndata
-Version: 0.0.5
+Version: 0.1.0
 Summary: Tool to convert markdown tables into json objects
 License: MIT
+License-File: LICENSE
 Author: Gordon Bean
 Author-email: gbean@cs.byu.edu
 Requires-Python: >=3.10,<4.0
@@ -12,6 +13,7 @@ Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
+Classifier: Programming Language :: Python :: 3.14
 Requires-Dist: bs4 (>=0.0.2,<0.0.3)
 Requires-Dist: markdown-it-py (>=3.0.0,<4.0.0)
 Requires-Dist: pyyaml (>=6.0.2,<7.0.0)

markdowndata-0.1.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,9 @@
+markdowndata/__init__.py,sha256=jB8leosqIVXuO4LmU0KWn3OyJwgAtGKQBab9JUsbSQ0,172
+markdowndata/content_parser.py,sha256=x0ellHrZn6RZynUzwFGnxdzhS_Y2tL33zzvKrEwBSQc,5157
+markdowndata/process_markdown.py,sha256=jswWDnkApAMoT1gEXe2dfSB2pHt6U3vFuWrh6PgQjBY,1981
+markdowndata/section_tree.py,sha256=gn6PtzXcg4iN7F8Tldy3p3jrWe9IYqrcDEAjNm940ME,2722
+markdowndata/utils.py,sha256=jVTKEGZiLCKdv1cS-73iMf_GaXT6cBc3cl9tp_fjKOw,2040
+markdowndata-0.1.0.dist-info/METADATA,sha256=DIZoJgyceiwDGWp40bNI04xmk8uZExE1tWr8aYCeYEs,706
+markdowndata-0.1.0.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
+markdowndata-0.1.0.dist-info/licenses/LICENSE,sha256=K-k1T7XcwAVVmLsHhfWMye6r7p45xz3xwv5S5FBSyZE,1074
+markdowndata-0.1.0.dist-info/RECORD,,

{markdowndata-0.0.5.dist-info → markdowndata-0.1.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: poetry-core 2.1.3
+Generator: poetry-core 2.2.1
 Root-Is-Purelib: true
 Tag: py3-none-any

markdowndata-0.0.5.dist-info/RECORD DELETED Viewed

@@ -1,9 +0,0 @@
-markdowndata/__init__.py,sha256=YWWuimxElvXp_jFOYzSAQ7zhtaGU2-jFmKYJq9Mtqp4,171
-markdowndata/content_parser.py,sha256=FdapNfkvCj71K5lUSGQh0H1jS5vF36-l1EImsX28J2o,5387
-markdowndata/process_markdown.py,sha256=ajJBMp2J5ipPUf4r3nxbl2JFdwKWV-82YL79RmWVrDA,2182
-markdowndata/section_tree.py,sha256=X4kPqHCa_2hkiq6roOHUc22G3pNIQjpUv_ni_J14XXQ,2060
-markdowndata/utils.py,sha256=jVTKEGZiLCKdv1cS-73iMf_GaXT6cBc3cl9tp_fjKOw,2040
-markdowndata-0.0.5.dist-info/LICENSE,sha256=K-k1T7XcwAVVmLsHhfWMye6r7p45xz3xwv5S5FBSyZE,1074
-markdowndata-0.0.5.dist-info/METADATA,sha256=4-ewjm9G3G8jmK0eU6DzWlnLtR7XGzxtICghQGj1cDw,633
-markdowndata-0.0.5.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
-markdowndata-0.0.5.dist-info/RECORD,,

{markdowndata-0.0.5.dist-info → markdowndata-0.1.0.dist-info/licenses}/LICENSE RENAMED Viewed

File without changes

markdowndata 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl

markdowndata 0.0.5py3-none-any.whl → 0.1.0py3-none-any.whl