PyPI - ssmd - Versions diffs - 0.5.3__py3-none-any.whl - Mend

ssmd 0.5.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20)

ssmd/__init__.py +189 -0
ssmd/_version.py +34 -0
ssmd/capabilities.py +277 -0
ssmd/document.py +918 -0
ssmd/formatter.py +244 -0
ssmd/parser.py +1049 -0
ssmd/parser_types.py +41 -0
ssmd/py.typed +0 -0
ssmd/segment.py +720 -0
ssmd/sentence.py +270 -0
ssmd/ssml_conversions.py +124 -0
ssmd/ssml_parser.py +599 -0
ssmd/types.py +122 -0
ssmd/utils.py +333 -0
ssmd/xsampa_to_ipa.txt +174 -0
ssmd-0.5.3.dist-info/METADATA +1210 -0
ssmd-0.5.3.dist-info/RECORD +20 -0
ssmd-0.5.3.dist-info/WHEEL +5 -0
ssmd-0.5.3.dist-info/licenses/LICENSE +21 -0
ssmd-0.5.3.dist-info/top_level.txt +1 -0

ssmd/__init__.py ADDED Viewed

@@ -0,0 +1,189 @@
+"""SSMD - Speech Synthesis Markdown to SSML converter.
+SSMD provides a lightweight markdown-like syntax for creating SSML
+(Speech Synthesis Markup Language) documents. It's designed to be
+more human-friendly than raw SSML while maintaining full compatibility.
+Example:
+    Basic usage::
+        import ssmd
+        # Create and build a document
+        doc = ssmd.Document()
+        doc.add_sentence("Hello *world*!")
+        doc.add_sentence("This is SSMD.")
+        # Export to different formats
+        ssml = doc.to_ssml()
+        text = doc.to_text()
+        # Or use convenience functions for one-off conversions
+        ssml = ssmd.to_ssml("Hello *world*!")
+    Advanced usage with streaming::
+        # Create a document with a capability preset and custom config
+        doc = ssmd.Document(
+            capabilities='pyttsx3',
+            config={'auto_sentence_tags': True}
+        )
+        # Build document incrementally
+        doc.add_paragraph("# Welcome")
+        doc.add_sentence("Hello and *welcome* to SSMD!")
+        # Stream to TTS
+        for sentence in doc.sentences():
+            tts_engine.speak(sentence)
+"""
+from typing import Any
+from ssmd.document import Document
+from ssmd.ssml_parser import SSMLParser
+from ssmd.capabilities import (
+    TTSCapabilities,
+    get_preset,
+    ESPEAK_CAPABILITIES,
+    PYTTSX3_CAPABILITIES,
+    GOOGLE_TTS_CAPABILITIES,
+    AMAZON_POLLY_CAPABILITIES,
+    AZURE_TTS_CAPABILITIES,
+    MINIMAL_CAPABILITIES,
+    FULL_CAPABILITIES,
+)
+from ssmd.parser import (
+    parse_sentences,
+    parse_segments,
+    parse_voice_blocks,
+)
+from ssmd.parser_types import (
+    SSMDSegment,
+    SSMDSentence,
+    VoiceAttrs,
+    ProsodyAttrs,
+    BreakAttrs,
+    SayAsAttrs,
+    AudioAttrs,
+    PhonemeAttrs,
+)
+from ssmd.segment import Segment
+from ssmd.sentence import Sentence
+from ssmd.types import (
+    HeadingConfig,
+    DEFAULT_HEADING_LEVELS,
+)
+from ssmd.formatter import format_ssmd
+from ssmd.utils import escape_ssmd_syntax, unescape_ssmd_syntax
+# ssmd/_version.py is a generated file (its header says not to track it in
+# version control), so it may be absent; fall back to a placeholder version
+# string instead of failing the package import.
+try:
+    from ssmd._version import version as __version__
+except ImportError:
+    __version__ = "unknown"
+# ═══════════════════════════════════════════════════════════
+# CONVENIENCE FUNCTIONS
+# ═══════════════════════════════════════════════════════════
+def to_ssml(ssmd_text: str, **config: Any) -> str:
+    """Render SSMD markup as SSML in a single call.
+    A throwaway ``Document`` is built from the text and the collected keyword
+    options, then serialized. For repeated conversions with the same config,
+    create a ``Document`` instance instead.
+    Args:
+        ssmd_text: SSMD markdown text
+        **config: Optional configuration parameters; they are gathered into
+            one dict and handed to ``Document`` as its second argument
+    Returns:
+        SSML string
+    Example:
+        >>> ssmd.to_ssml("Hello *world*!")
+        '<speak>Hello <emphasis>world</emphasis>!</speak>'
+    """
+    document = Document(ssmd_text, config)
+    return document.to_ssml()
+def to_text(ssmd_text: str, **config: Any) -> str:
+    """Reduce SSMD markup to plain text in a single call.
+    A throwaway ``Document`` is built from the text and the collected keyword
+    options, and its plain-text rendering is returned.
+    Args:
+        ssmd_text: SSMD markdown text
+        **config: Optional configuration parameters; they are gathered into
+            one dict and handed to ``Document`` as its second argument
+    Returns:
+        Plain text with markup removed
+    Example:
+        >>> ssmd.to_text("Hello *world* @marker!")
+        'Hello world!'
+    """
+    document = Document(ssmd_text, config)
+    return document.to_text()
+def from_ssml(ssml_text: str, **config: Any) -> str:
+    """Translate an SSML document back into SSMD markup in a single call.
+    Args:
+        ssml_text: SSML XML string
+        **config: Optional configuration parameters; they are gathered into
+            one dict and handed to ``SSMLParser``
+    Returns:
+        SSMD markdown string
+    Example:
+        >>> ssml = '<speak><emphasis>Hello</emphasis> world</speak>'
+        >>> ssmd.from_ssml(ssml)
+        '*Hello* world'
+    """
+    return SSMLParser(config).to_ssmd(ssml_text)
+# Public API of the package; every name listed here is imported or defined
+# above in this module.
+__all__ = [
+    # Document class and one-call convenience converters
+    "Document",
+    "to_ssml",
+    "to_text",
+    "from_ssml",
+    # SSML -> SSMD parser and capability model
+    "SSMLParser",
+    "TTSCapabilities",
+    "get_preset",
+    # Capability presets
+    "ESPEAK_CAPABILITIES",
+    "PYTTSX3_CAPABILITIES",
+    "GOOGLE_TTS_CAPABILITIES",
+    "AMAZON_POLLY_CAPABILITIES",
+    "AZURE_TTS_CAPABILITIES",
+    "MINIMAL_CAPABILITIES",
+    "FULL_CAPABILITIES",
+    # Parser functions
+    "parse_sentences",
+    "parse_segments",
+    "parse_voice_blocks",
+    # Formatter (from ssmd.formatter)
+    "format_ssmd",
+    # Utility functions
+    "escape_ssmd_syntax",
+    "unescape_ssmd_syntax",
+    # New core classes
+    "Segment",
+    "Sentence",
+    # Types
+    "VoiceAttrs",
+    "ProsodyAttrs",
+    "BreakAttrs",
+    "SayAsAttrs",
+    "AudioAttrs",
+    "PhonemeAttrs",
+    "HeadingConfig",
+    "DEFAULT_HEADING_LEVELS",
+    # Backward compatibility aliases
+    "SSMDSegment",
+    "SSMDSentence",
+    # Package metadata
+    "__version__",
+]

ssmd/_version.py ADDED Viewed

@@ -0,0 +1,34 @@
+# file generated by setuptools-scm
+# don't change, don't track in version control
+# Exported names: the version string, its tuple form and the commit id, each
+# under a plain and a dunder spelling.
+__all__ = [
+    "__version__",
+    "__version_tuple__",
+    "version",
+    "version_tuple",
+    "__commit_id__",
+    "commit_id",
+]
+# Defined locally as False, so the typing imports in the first branch never
+# run at runtime. NOTE(review): static type checkers are expected to treat
+# the name TYPE_CHECKING as true and pick up the precise aliases - confirm.
+TYPE_CHECKING = False
+if TYPE_CHECKING:
+    from typing import Tuple
+    from typing import Union
+    VERSION_TUPLE = Tuple[Union[int, str], ...]
+    COMMIT_ID = Union[str, None]
+else:
+    # Runtime placeholders so the annotations below have something to name.
+    VERSION_TUPLE = object
+    COMMIT_ID = object
+# Annotation-only declarations; the values are bound at the end of the file.
+version: str
+__version__: str
+__version_tuple__: VERSION_TUPLE
+version_tuple: VERSION_TUPLE
+commit_id: COMMIT_ID
+__commit_id__: COMMIT_ID
+# Concrete values for this build; each pair of names shares one object.
+__version__ = version = '0.5.3'
+__version_tuple__ = version_tuple = (0, 5, 3)
+__commit_id__ = commit_id = None

ssmd/capabilities.py ADDED Viewed

@@ -0,0 +1,277 @@
+"""TTS capability definitions and presets.
+This module defines which SSML features are supported by various TTS engines
+and provides capability-based filtering for SSMD processing.
+"""
+from typing import Any
+class TTSCapabilities:
+    """Describe which SSML features a TTS engine can handle.
+    Each constructor flag marks one SSML feature as supported or not.
+    ``to_config`` turns the flags into a converter configuration listing the
+    processors to skip; the converter is then expected to fall back to plain
+    text for those features.
+    Example:
+        >>> # Engine without emphasis or prosody support
+        >>> caps = TTSCapabilities(emphasis=False, prosody=False)
+        >>> caps.to_config()["skip"]
+        ['emphasis', 'prosody']
+        >>> # Per-attribute prosody flags follow the general switch
+        >>> caps.prosody_rate
+        False
+    """
+    def __init__(
+        self,
+        # Core features
+        emphasis: bool = True,
+        break_tags: bool = True,
+        paragraph: bool = True,
+        # Language & pronunciation
+        language: bool = True,
+        phoneme: bool = True,
+        substitution: bool = True,
+        # Prosody (volume, rate, pitch)
+        prosody: bool = True,
+        prosody_volume: bool = True,
+        prosody_rate: bool = True,
+        prosody_pitch: bool = True,
+        # Advanced features
+        say_as: bool = True,
+        audio: bool = True,
+        mark: bool = True,
+        # Extensions (platform-specific)
+        extensions: dict[str, bool] | None = None,
+        # Sentence and heading support
+        sentence_tags: bool = True,
+        heading_emphasis: bool = True,
+    ):
+        """Record the supported-feature flags.
+        Args:
+            emphasis: Support for <emphasis> tags
+            break_tags: Support for <break> tags
+            paragraph: Support for <p> tags
+            language: Support for <lang> tags
+            phoneme: Support for <phoneme> tags
+            substitution: Support for <sub> tags
+            prosody: Support for <prosody> tags (general); when false, the
+                three per-attribute prosody flags are stored as false too
+            prosody_volume: Support for volume attribute
+            prosody_rate: Support for rate attribute
+            prosody_pitch: Support for pitch attribute
+            say_as: Support for <say-as> tags
+            audio: Support for <audio> tags
+            mark: Support for <mark> tags
+            extensions: Dict of extension names and their support; a missing
+                or empty value is stored as an empty dict
+            sentence_tags: Support for <s> tags
+            heading_emphasis: Support for heading emphasis
+        """
+        # Core features
+        self.emphasis = emphasis
+        self.break_tags = break_tags
+        self.paragraph = paragraph
+        # Language & pronunciation
+        self.language = language
+        self.phoneme = phoneme
+        self.substitution = substitution
+        # Prosody: an attribute flag only counts while the general switch is on
+        self.prosody = prosody
+        self.prosody_volume = prosody_volume and prosody
+        self.prosody_rate = prosody_rate and prosody
+        self.prosody_pitch = prosody_pitch and prosody
+        # Advanced features
+        self.say_as = say_as
+        self.audio = audio
+        self.mark = mark
+        self.extensions = extensions if extensions else {}
+        # Sentence and heading support
+        self.sentence_tags = sentence_tags
+        self.heading_emphasis = heading_emphasis
+    def to_config(self) -> dict[str, Any]:
+        """Build the SSMD converter configuration for these capabilities.
+        Returns:
+            Dict with ``"skip"`` (processor names for unsupported features, in
+            a fixed order), ``"capabilities"`` (this instance) and, only when
+            heading emphasis is unsupported, an empty ``"heading_levels"``
+        """
+        # (flag, processor name) pairs; the order fixes the order of "skip".
+        # Prosody is switched off as a whole here; its individual attributes
+        # are exposed through the capabilities object itself.
+        processor_flags = (
+            (self.emphasis, "emphasis"),
+            (self.break_tags, "break"),
+            (self.paragraph, "paragraph"),
+            (self.mark, "mark"),
+            (self.prosody, "prosody"),
+        )
+        skipped = [
+            processor for supported, processor in processor_flags if not supported
+        ]
+        config: dict[str, Any] = {"skip": skipped, "capabilities": self}
+        if not self.heading_emphasis:
+            # An empty mapping means no heading processing
+            config["heading_levels"] = {}
+        return config
+    def supports_extension(self, extension_name: str) -> bool:
+        """Report whether a platform-specific extension is enabled.
+        Args:
+            extension_name: Name of the extension
+        Returns:
+            The value stored for that name, or False when it is not listed
+        """
+        registered = self.extensions
+        return registered.get(extension_name, False)
+# Preset capability definitions for common TTS engines
+# Each preset is one shared module-level instance; the lookup table further
+# down hands out these same objects rather than copies.
+ESPEAK_CAPABILITIES = TTSCapabilities(
+    emphasis=False,  # eSpeak doesn't support emphasis
+    break_tags=True,
+    paragraph=False,  # eSpeak treats paragraphs as plain text
+    language=True,
+    phoneme=True,  # eSpeak has good phoneme support
+    substitution=False,
+    prosody=True,
+    prosody_volume=True,
+    prosody_rate=True,
+    prosody_pitch=True,
+    say_as=False,
+    audio=False,  # No audio file support
+    mark=False,
+    sentence_tags=False,
+    heading_emphasis=False,
+)
+PYTTSX3_CAPABILITIES = TTSCapabilities(
+    emphasis=False,  # pyttsx3 has minimal SSML support
+    break_tags=False,
+    paragraph=False,
+    language=False,  # Voice selection, not SSML
+    phoneme=False,
+    substitution=False,
+    prosody=True,  # Via properties, not SSML
+    prosody_volume=True,
+    prosody_rate=True,
+    prosody_pitch=False,
+    say_as=False,
+    audio=False,
+    mark=False,
+    sentence_tags=False,
+    heading_emphasis=False,
+)
+# Every flag below equals the constructor default; spelled out explicitly.
+GOOGLE_TTS_CAPABILITIES = TTSCapabilities(
+    emphasis=True,
+    break_tags=True,
+    paragraph=True,
+    language=True,
+    phoneme=True,
+    substitution=True,
+    prosody=True,
+    prosody_volume=True,
+    prosody_rate=True,
+    prosody_pitch=True,
+    say_as=True,
+    audio=True,
+    mark=True,
+    sentence_tags=True,
+    heading_emphasis=True,
+)
+# The only preset here that disables audio while keeping everything else on,
+# and the only one that registers extensions.
+AMAZON_POLLY_CAPABILITIES = TTSCapabilities(
+    emphasis=True,
+    break_tags=True,
+    paragraph=True,
+    language=True,
+    phoneme=True,
+    substitution=True,
+    prosody=True,
+    prosody_volume=True,
+    prosody_rate=True,
+    prosody_pitch=True,
+    say_as=True,
+    audio=False,  # Limited audio support
+    mark=True,
+    extensions={"whisper": True, "drc": True},  # Amazon-specific
+    sentence_tags=True,
+    heading_emphasis=True,
+)
+# Every flag below equals the constructor default; spelled out explicitly.
+AZURE_TTS_CAPABILITIES = TTSCapabilities(
+    emphasis=True,
+    break_tags=True,
+    paragraph=True,
+    language=True,
+    phoneme=True,
+    substitution=True,
+    prosody=True,
+    prosody_volume=True,
+    prosody_rate=True,
+    prosody_pitch=True,
+    say_as=True,
+    audio=True,
+    mark=True,
+    sentence_tags=True,
+    heading_emphasis=True,
+)
+# Minimal fallback (plain text only)
+# The prosody_* flags are not passed: with prosody=False the constructor
+# stores all three as False regardless of their defaults.
+MINIMAL_CAPABILITIES = TTSCapabilities(
+    emphasis=False,
+    break_tags=False,
+    paragraph=False,
+    language=False,
+    phoneme=False,
+    substitution=False,
+    prosody=False,
+    say_as=False,
+    audio=False,
+    mark=False,
+    sentence_tags=False,
+    heading_emphasis=False,
+)
+# Full SSML support (reference)
+# Built from the constructor defaults: every feature on, no extensions.
+FULL_CAPABILITIES = TTSCapabilities()
+# Preset lookup
+# Keys are lowercase. "amazon" and "microsoft" are aliases: they map to the
+# same objects as "polly" and "azure".
+PRESETS: dict[str, TTSCapabilities] = {
+    "espeak": ESPEAK_CAPABILITIES,
+    "pyttsx3": PYTTSX3_CAPABILITIES,
+    "google": GOOGLE_TTS_CAPABILITIES,
+    "polly": AMAZON_POLLY_CAPABILITIES,
+    "amazon": AMAZON_POLLY_CAPABILITIES,
+    "azure": AZURE_TTS_CAPABILITIES,
+    "microsoft": AZURE_TTS_CAPABILITIES,
+    "minimal": MINIMAL_CAPABILITIES,
+    "full": FULL_CAPABILITIES,
+}
+def get_preset(name: str) -> TTSCapabilities:
+    """Look up a capability preset by name, ignoring case.
+    Args:
+        name: Preset name (espeak, pyttsx3, google, polly or amazon,
+            azure or microsoft, minimal, full)
+    Returns:
+        The shared TTSCapabilities instance registered under that name
+    Raises:
+        ValueError: If preset not found; the message lists the known names
+    """
+    # Normalise once; the lookup table is keyed by lowercase names.
+    key = name.lower()
+    if key in PRESETS:
+        return PRESETS[key]
+    available = ", ".join(PRESETS)
+    raise ValueError(f"Unknown preset '{name}'. Available: {available}")