PyPI - notionary - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl - Mend

notionary 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49) hide show

notionary/core/__init__.py +0 -0
notionary/core/converters/__init__.py +50 -0
notionary/core/converters/elements/__init__.py +0 -0
notionary/core/converters/elements/bookmark_element.py +224 -0
notionary/core/converters/elements/callout_element.py +179 -0
notionary/core/converters/elements/code_block_element.py +153 -0
notionary/core/converters/elements/column_element.py +294 -0
notionary/core/converters/elements/divider_element.py +73 -0
notionary/core/converters/elements/heading_element.py +84 -0
notionary/core/converters/elements/image_element.py +130 -0
notionary/core/converters/elements/list_element.py +130 -0
notionary/core/converters/elements/notion_block_element.py +51 -0
notionary/core/converters/elements/paragraph_element.py +73 -0
notionary/core/converters/elements/qoute_element.py +242 -0
notionary/core/converters/elements/table_element.py +306 -0
notionary/core/converters/elements/text_inline_formatter.py +294 -0
notionary/core/converters/elements/todo_lists.py +114 -0
notionary/core/converters/elements/toggle_element.py +205 -0
notionary/core/converters/elements/video_element.py +159 -0
notionary/core/converters/markdown_to_notion_converter.py +482 -0
notionary/core/converters/notion_to_markdown_converter.py +45 -0
notionary/core/converters/registry/__init__.py +0 -0
notionary/core/converters/registry/block_element_registry.py +234 -0
notionary/core/converters/registry/block_element_registry_builder.py +280 -0
notionary/core/database/database_info_service.py +43 -0
notionary/core/database/database_query_service.py +73 -0
notionary/core/database/database_schema_service.py +57 -0
notionary/core/database/models/page_result.py +10 -0
notionary/core/database/notion_database_manager.py +332 -0
notionary/core/database/notion_database_manager_factory.py +233 -0
notionary/core/database/notion_database_schema.py +415 -0
notionary/core/database/notion_database_writer.py +390 -0
notionary/core/database/page_service.py +161 -0
notionary/core/notion_client.py +134 -0
notionary/core/page/meta_data/metadata_editor.py +37 -0
notionary/core/page/notion_page_manager.py +110 -0
notionary/core/page/page_content_manager.py +85 -0
notionary/core/page/property_formatter.py +97 -0
notionary/exceptions/database_exceptions.py +76 -0
notionary/exceptions/page_creation_exception.py +9 -0
notionary/util/logging_mixin.py +47 -0
notionary/util/singleton_decorator.py +20 -0
notionary/util/uuid_utils.py +24 -0
{notionary-0.1.2.dist-info → notionary-0.1.3.dist-info}/METADATA +1 -1
notionary-0.1.3.dist-info/RECORD +49 -0
notionary-0.1.2.dist-info/RECORD +0 -6
{notionary-0.1.2.dist-info → notionary-0.1.3.dist-info}/WHEEL +0 -0
{notionary-0.1.2.dist-info → notionary-0.1.3.dist-info}/licenses/LICENSE +0 -0
{notionary-0.1.2.dist-info → notionary-0.1.3.dist-info}/top_level.txt +0 -0

notionary/core/converters/markdown_to_notion_converter.py ADDED Viewed

@@ -0,0 +1,482 @@
+from typing import Dict, Any, List, Optional, Tuple
+from notionary.core.converters.registry.block_element_registry import (
+    BlockElementRegistry,
+)
+from notionary.core.converters.registry.block_element_registry_builder import (
+    BlockElementRegistryBuilder,
+)
+class MarkdownToNotionConverter:
+    SPACER_MARKER = "<!-- spacer -->"
+    MULTILINE_CONTENT_MARKER = "<!-- REMOVED_MULTILINE_CONTENT -->"
+    TOGGLE_MARKER = "<!-- toggle_content -->"
+    def __init__(self, block_registry: Optional[BlockElementRegistry] = None):
+        """
+        Initialize the MarkdownToNotionConverter.
+        Args:
+            block_registry: Optional registry of Notion block elements
+        """
+        self._block_registry = (
+            block_registry or BlockElementRegistryBuilder().create_standard_registry()
+        )
+        self._setup_element_callbacks()
+    def _setup_element_callbacks(self) -> None:
+        """Registriert den Converter als Callback für Elemente, die ihn benötigen."""
+        for element in self._block_registry.get_elements():
+            if hasattr(element, "set_converter_callback"):
+                element.set_converter_callback(self.convert)
+    def convert(self, markdown_text: str) -> List[Dict[str, Any]]:
+        """
+        Convert markdown text to Notion API block format.
+        Args:
+            markdown_text: The markdown text to convert
+        Returns:
+            List of Notion blocks
+        """
+        if not markdown_text:
+            return []
+        # Process toggles first
+        processed_text, toggle_blocks = self._extract_toggle_elements(markdown_text)
+        # Process other multiline elements
+        processed_text, multiline_blocks = self._extract_multiline_elements(
+            processed_text
+        )
+        # Process remaining text line by line
+        line_blocks = self._process_text_lines(processed_text)
+        # Combine and sort all blocks
+        all_blocks = toggle_blocks + multiline_blocks + line_blocks
+        all_blocks.sort(key=lambda x: x[0])
+        # Extract just the blocks from position tuples
+        blocks = [block for _, _, block in all_blocks]
+        # Process spacing between blocks
+        return self._process_block_spacing(blocks)
+    def _extract_toggle_elements(
+        self, text: str
+    ) -> Tuple[str, List[Tuple[int, int, Dict[str, Any]]]]:
+        """
+        Extract toggle elements and their nested content using the ToggleElement class.
+        Args:
+            text: The text to process
+        Returns:
+            Tuple of (processed text, list of (start_pos, end_pos, block) tuples)
+        """
+        # Find toggle element in registry
+        toggle_element = None
+        for element in self._block_registry.get_elements():
+            if (
+                element.is_multiline()
+                and hasattr(element, "match_markdown")
+                and element.__name__ == "ToggleElement"
+            ):
+                toggle_element = element
+                break
+        if not toggle_element:
+            # No toggle element found, return text as is
+            return text, []
+        # Use the find_matches method of ToggleElement to find and process all toggles
+        # Pass the converter's convert method as a callback to process nested content
+        toggle_blocks = toggle_element.find_matches(text, self.convert)
+        if not toggle_blocks:
+            return text, []
+        # Create a processed text with toggle markers
+        lines = text.split("\n")
+        processed_lines = lines.copy()
+        # Replace toggle content with markers
+        for start_pos, end_pos, _ in reversed(toggle_blocks):
+            # Calculate line indices for this toggle
+            start_line_index = 0
+            current_pos = 0
+            for i, line in enumerate(lines):
+                line_length = len(line) + 1  # +1 for newline
+                if current_pos <= start_pos < current_pos + line_length:
+                    start_line_index = i
+                    break
+                current_pos += line_length
+            end_line_index = start_line_index
+            current_pos = 0
+            for i, line in enumerate(lines):
+                line_length = len(line) + 1  # +1 for newline
+                if current_pos <= end_pos < current_pos + line_length:
+                    end_line_index = i
+                    break
+                current_pos += line_length
+            # Replace toggle content with markers
+            num_lines = end_line_index - start_line_index + 1
+            for i in range(start_line_index, start_line_index + num_lines):
+                processed_lines[i] = self.TOGGLE_MARKER
+        processed_text = "\n".join(processed_lines)
+        return processed_text, toggle_blocks
+    def _extract_multiline_elements(
+        self, text: str
+    ) -> Tuple[str, List[Tuple[int, int, Dict[str, Any]]]]:
+        """
+        Extract multiline elements and remove them from the text.
+        Args:
+            text: The text to process
+        Returns:
+            Tuple of (processed text, list of (start_pos, end_pos, block) tuples)
+        """
+        if not text:
+            return text, []
+        multiline_blocks = []
+        processed_text = text
+        # Get all multiline elements except ToggleElement
+        multiline_elements = [
+            element
+            for element in self._block_registry.get_multiline_elements()
+            if element.__name__ != "ToggleElement"
+        ]
+        if not multiline_elements:
+            return text, []
+        for element in multiline_elements:
+            if not hasattr(element, "find_matches"):
+                continue
+            # Find all matches for this element (pass the convert method as callback if needed)
+            if hasattr(element, "set_converter_callback"):
+                matches = element.find_matches(processed_text, self.convert)
+            else:
+                matches = element.find_matches(processed_text)
+            if not matches:
+                continue
+            multiline_blocks.extend(matches)
+            # Remove matched content from the text to avoid processing it again
+            processed_text = self._replace_matched_content_with_markers(
+                processed_text, matches
+            )
+        return processed_text, multiline_blocks
+    def _replace_matched_content_with_markers(
+        self, text: str, matches: List[Tuple[int, int, Dict[str, Any]]]
+    ) -> str:
+        """Replace matched content with marker placeholders to preserve line structure."""
+        for start, end, _ in reversed(matches):
+            num_newlines = text[start:end].count("\n")
+            text = (
+                text[:start]
+                + "\n"
+                + self.MULTILINE_CONTENT_MARKER
+                + "\n" * num_newlines
+                + text[end:]
+            )
+        return text
+    def _process_text_lines(self, text: str) -> List[Tuple[int, int, Dict[str, Any]]]:
+        """
+        Process text line by line for single-line elements.
+        Args:
+            text: The text to process
+        Returns:
+            List of (start_pos, end_pos, block) tuples
+        """
+        if not text:
+            return []
+        line_blocks = []
+        lines = text.split("\n")
+        current_pos = 0
+        current_paragraph = []
+        paragraph_start = 0
+        in_todo_sequence = False
+        for line in lines:
+            line_length = len(line) + 1  # +1 for newline
+            # Skip marker lines
+            if self._is_marker_line(line):
+                current_pos += line_length
+                continue
+            # Check for spacer marker
+            if self._is_spacer_marker(line):
+                line_blocks.append(
+                    (
+                        current_pos,
+                        current_pos + line_length,
+                        self._create_empty_paragraph(),
+                    )
+                )
+                current_pos += line_length
+                continue
+            # Process todos first to keep them grouped
+            todo_block = self._extract_todo_item(line)
+            if todo_block:
+                self._handle_todo_item(
+                    todo_block,
+                    line_length,
+                    current_pos,
+                    current_paragraph,
+                    paragraph_start,
+                    line_blocks,
+                    in_todo_sequence,
+                )
+                in_todo_sequence = True
+                current_pos += line_length
+                continue
+            if in_todo_sequence:
+                in_todo_sequence = False
+            if not line.strip():
+                self._process_paragraph_if_present(
+                    current_paragraph, paragraph_start, current_pos, line_blocks
+                )
+                current_paragraph = []
+                current_pos += line_length
+                continue
+            special_block = self._extract_special_block(line)
+            if special_block:
+                self._process_paragraph_if_present(
+                    current_paragraph, paragraph_start, current_pos, line_blocks
+                )
+                line_blocks.append(
+                    (current_pos, current_pos + line_length, special_block)
+                )
+                current_paragraph = []
+                current_pos += line_length
+                continue
+            # Handle as part of paragraph
+            if not current_paragraph:
+                paragraph_start = current_pos
+            current_paragraph.append(line)
+            current_pos += line_length
+        # Process any remaining paragraph content
+        self._process_paragraph_if_present(
+            current_paragraph, paragraph_start, current_pos, line_blocks
+        )
+        return line_blocks
+    def _is_marker_line(self, line: str) -> bool:
+        """Check if a line is any kind of marker line that should be skipped."""
+        return self._is_multiline_marker(line) or self._is_toggle_marker(line)
+    def _is_multiline_marker(self, line: str) -> bool:
+        """Check if a line is a multiline content marker."""
+        return line.strip() == self.MULTILINE_CONTENT_MARKER
+    def _is_toggle_marker(self, line: str) -> bool:
+        """Check if a line is a toggle content marker."""
+        return line.strip() == self.TOGGLE_MARKER
+    def _is_spacer_marker(self, line: str) -> bool:
+        """Check if a line is a spacer marker."""
+        return line.strip() == self.SPACER_MARKER
+    def _extract_todo_item(self, line: str) -> Optional[Dict[str, Any]]:
+        """
+        Try to extract a todo item from a line.
+        Returns:
+            Todo block if line is a todo item, None otherwise
+        """
+        for element in self._block_registry.get_elements():
+            if (
+                not element.is_multiline()
+                and hasattr(element, "match_markdown")
+                and element.__name__ == "TodoElement"
+                and element.match_markdown(line)
+            ):
+                return element.markdown_to_notion(line)
+        return None
+    def _handle_todo_item(
+        self,
+        todo_block: Dict[str, Any],
+        line_length: int,
+        current_pos: int,
+        current_paragraph: List[str],
+        paragraph_start: int,
+        line_blocks: List[Tuple[int, int, Dict[str, Any]]],
+        in_todo_sequence: bool,
+    ) -> None:
+        """Handle a todo item line."""
+        # If we were building a paragraph, finish it before starting todos
+        if not in_todo_sequence and current_paragraph:
+            self._process_paragraph_if_present(
+                current_paragraph, paragraph_start, current_pos, line_blocks
+            )
+            current_paragraph.clear()
+        line_blocks.append((current_pos, current_pos + line_length, todo_block))
+    def _extract_special_block(self, line: str) -> Optional[Dict[str, Any]]:
+        """
+        Try to extract a special block (not paragraph) from a line.
+        Returns:
+            Block if line is a special block, None otherwise
+        """
+        for element in self._block_registry.get_elements():
+            if (
+                not element.is_multiline()
+                and hasattr(element, "match_markdown")
+                and element.match_markdown(line)
+            ):
+                block = element.markdown_to_notion(line)
+                if block and block.get("type") != "paragraph":
+                    return block
+        return None
+    def _process_paragraph_if_present(
+        self,
+        paragraph_lines: List[str],
+        start_pos: int,
+        end_pos: int,
+        blocks: List[Tuple[int, int, Dict[str, Any]]],
+    ) -> None:
+        """
+        Process a paragraph and add it to the blocks list if valid.
+        Args:
+            paragraph_lines: Lines that make up the paragraph
+            start_pos: Starting position of the paragraph
+            end_pos: Ending position of the paragraph
+            blocks: List to add the processed paragraph block to
+        """
+        if not paragraph_lines:
+            return
+        paragraph_text = "\n".join(paragraph_lines)
+        block = self._block_registry.markdown_to_notion(paragraph_text)
+        if not block:
+            return
+        blocks.append((start_pos, end_pos, block))
+    def _process_block_spacing(
+        self, blocks: List[Dict[str, Any]]
+    ) -> List[Dict[str, Any]]:
+        """
+        Process blocks and add spacing only where no explicit spacer is present.
+        Args:
+            blocks: List of Notion blocks
+        Returns:
+            List of Notion blocks with processed spacing
+        """
+        if not blocks:
+            return blocks
+        final_blocks = []
+        i = 0
+        while i < len(blocks):
+            current_block = blocks[i]
+            final_blocks.append(current_block)
+            # Check if this is a multiline element that needs spacing
+            if not self._is_multiline_block_type(current_block.get("type")):
+                i += 1
+                continue
+            # Check if the next block is already a spacer
+            if i + 1 < len(blocks) and self._is_empty_paragraph(blocks[i + 1]):
+                # Next block is already a spacer, don't add another
+                pass
+            else:
+                # No explicit spacer found, add one automatically
+                final_blocks.append(self._create_empty_paragraph())
+            i += 1
+        return final_blocks
+    def _is_multiline_block_type(self, block_type: str) -> bool:
+        """
+        Check if a block type corresponds to a multiline element.
+        Args:
+            block_type: The type of block to check
+        Returns:
+            True if the block type is a multiline element, False otherwise
+        """
+        if not block_type:
+            return False
+        multiline_elements = self._block_registry.get_multiline_elements()
+        for element in multiline_elements:
+            element_name = element.__name__.lower()
+            if block_type in element_name:
+                return True
+            if hasattr(element, "match_notion"):
+                dummy_block = {"type": block_type}
+                if element.match_notion(dummy_block):
+                    return True
+        return False
+    def _is_empty_paragraph(self, block: Dict[str, Any]) -> bool:
+        """
+        Check if a block is an empty paragraph.
+        Args:
+            block: The block to check
+        Returns:
+            True if it's an empty paragraph, False otherwise
+        """
+        if block.get("type") != "paragraph":
+            return False
+        rich_text = block.get("paragraph", {}).get("rich_text", [])
+        return not rich_text or len(rich_text) == 0
+    def _create_empty_paragraph(self) -> Dict[str, Any]:
+        """
+        Create an empty paragraph block.
+        Returns:
+            Empty paragraph block dictionary
+        """
+        return {"type": "paragraph", "paragraph": {"rich_text": []}}

notionary/core/converters/notion_to_markdown_converter.py ADDED Viewed

@@ -0,0 +1,45 @@
+from typing import Dict, Any, List, Optional
+from notionary.core.converters.registry.block_element_registry import (
+    BlockElementRegistry,
+)
+from notionary.core.converters.registry.block_element_registry_builder import (
+    BlockElementRegistryBuilder,
+)
+class NotionToMarkdownConverter:
+    """Converts Notion blocks to Markdown text."""
+    def __init__(self, block_registry: Optional[BlockElementRegistry] = None):
+        """
+        Initialize the MarkdownToNotionConverter.
+        Args:
+            block_registry: Optional registry of Notion block elements
+        """
+        self._block_registry = (
+            block_registry or BlockElementRegistryBuilder().create_standard_registry()
+        )
+    def convert(self, blocks: List[Dict[str, Any]]) -> str:
+        """
+        Convert Notion blocks to Markdown text.
+        Args:
+            blocks: List of Notion blocks
+        Returns:
+            Markdown text
+        """
+        if not blocks:
+            return ""
+        markdown_parts = []
+        for block in blocks:
+            markdown = self._block_registry.notion_to_markdown(block)
+            if markdown:
+                markdown_parts.append(markdown)
+        return "\n\n".join(markdown_parts)

notionary/core/converters/registry/__init__.py ADDED Viewed

File without changes

notionary 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl

notionary 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl