kernpy 0.0.2__py3-none-any.whl → 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (56)
  1. kernpy/__init__.py +215 -0
  2. kernpy/__main__.py +217 -0
  3. kernpy/core/__init__.py +119 -0
  4. kernpy/core/_io.py +48 -0
  5. kernpy/core/base_antlr_importer.py +61 -0
  6. kernpy/core/base_antlr_spine_parser_listener.py +196 -0
  7. kernpy/core/basic_spine_importer.py +43 -0
  8. kernpy/core/document.py +965 -0
  9. kernpy/core/dyn_importer.py +30 -0
  10. kernpy/core/dynam_spine_importer.py +42 -0
  11. kernpy/core/error_listener.py +51 -0
  12. kernpy/core/exporter.py +535 -0
  13. kernpy/core/fing_spine_importer.py +42 -0
  14. kernpy/core/generated/kernSpineLexer.interp +444 -0
  15. kernpy/core/generated/kernSpineLexer.py +535 -0
  16. kernpy/core/generated/kernSpineLexer.tokens +236 -0
  17. kernpy/core/generated/kernSpineParser.interp +425 -0
  18. kernpy/core/generated/kernSpineParser.py +9954 -0
  19. kernpy/core/generated/kernSpineParser.tokens +236 -0
  20. kernpy/core/generated/kernSpineParserListener.py +1200 -0
  21. kernpy/core/generated/kernSpineParserVisitor.py +673 -0
  22. kernpy/core/generic.py +426 -0
  23. kernpy/core/gkern.py +526 -0
  24. kernpy/core/graphviz_exporter.py +89 -0
  25. kernpy/core/harm_spine_importer.py +41 -0
  26. kernpy/core/import_humdrum_old.py +853 -0
  27. kernpy/core/importer.py +285 -0
  28. kernpy/core/importer_factory.py +43 -0
  29. kernpy/core/kern_spine_importer.py +73 -0
  30. kernpy/core/mens_spine_importer.py +23 -0
  31. kernpy/core/mhxm_spine_importer.py +44 -0
  32. kernpy/core/pitch_models.py +338 -0
  33. kernpy/core/root_spine_importer.py +58 -0
  34. kernpy/core/spine_importer.py +45 -0
  35. kernpy/core/text_spine_importer.py +43 -0
  36. kernpy/core/tokenizers.py +239 -0
  37. kernpy/core/tokens.py +2011 -0
  38. kernpy/core/transposer.py +300 -0
  39. kernpy/io/__init__.py +14 -0
  40. kernpy/io/public.py +355 -0
  41. kernpy/polish_scores/__init__.py +13 -0
  42. kernpy/polish_scores/download_polish_dataset.py +357 -0
  43. kernpy/polish_scores/iiif.py +47 -0
  44. kernpy/test_grammar.sh +22 -0
  45. kernpy/util/__init__.py +14 -0
  46. kernpy/util/helpers.py +55 -0
  47. kernpy/util/store_cache.py +35 -0
  48. kernpy/visualize_analysis.sh +23 -0
  49. kernpy-1.0.0.dist-info/METADATA +501 -0
  50. kernpy-1.0.0.dist-info/RECORD +51 -0
  51. {kernpy-0.0.2.dist-info → kernpy-1.0.0.dist-info}/WHEEL +1 -2
  52. kernpy/example.py +0 -1
  53. kernpy-0.0.2.dist-info/LICENSE +0 -19
  54. kernpy-0.0.2.dist-info/METADATA +0 -19
  55. kernpy-0.0.2.dist-info/RECORD +0 -7
  56. kernpy-0.0.2.dist-info/top_level.txt +0 -1
kernpy/core/tokenizers.py
@@ -0,0 +1,239 @@
+ from __future__ import annotations
+
+ from copy import deepcopy
+ from enum import Enum
+ from abc import ABC, abstractmethod
+ from typing import List, Union, Set
+
+ from kernpy.core import DECORATION_SEPARATOR, Token, TOKEN_SEPARATOR
+
+
+ class Encoding(Enum):  # TODO: Eventually, polymorphism will be used to export different types of kern files
+     """
+     Options for exporting a kern file.
+
+     Example:
+         >>> import kernpy as kp
+         >>> # Load a file
+         >>> doc, _ = kp.load('path/to/file.krn')
+         >>>
+         >>> # Save the file using the specified encoding
+         >>> exported_content = kp.dumps(tokenizer=kp.Encoding.normalizedKern)
+     """
+     eKern = 'ekern'
+     normalizedKern = 'kern'
+     bKern = 'bkern'
+     bEkern = 'bekern'
+
+     def prefix(self) -> str:
+         """
+         Get the prefix of the kern type.
+
+         Returns (str): Prefix of the kern type.
+         """
+         if self == Encoding.eKern:
+             return 'e'
+         elif self == Encoding.normalizedKern:
+             return ''
+         elif self == Encoding.bKern:
+             return 'b'
+         elif self == Encoding.bEkern:
+             return 'be'
+         else:
+             raise ValueError(f'Unknown kern type: {self}. '
+                              f'Supported types are: '
+                              f"{'-'.join([kern_type.name for kern_type in Encoding.__members__.values()])}")
+
+
+ class Tokenizer(ABC):
+     """
+     Tokenizer interface. All tokenizers must implement this interface.
+
+     Tokenizers are responsible for converting a token into a string representation.
+     """
+     def __init__(self, *, token_categories: Set['TokenCategory']):
+         """
+         Create a new Tokenizer.
+
+         Args:
+             token_categories (Set[TokenCategory]): Set of categories to be tokenized.
+                 If None, an exception will be raised.
+         """
+         if token_categories is None:
+             raise ValueError('Categories must be provided. Found None.')
+
+         self.token_categories = token_categories
+
+
+     @abstractmethod
+     def tokenize(self, token: Token) -> str:
+         """
+         Tokenize a token into a string representation.
+
+         Args:
+             token (Token): Token to be tokenized.
+
+         Returns (str): Tokenized string representation.
+
+         """
+         pass
+
+
+ class KernTokenizer(Tokenizer):
+     """
+     KernTokenizer converts a Token into a normalized kern string representation.
+     """
+     def __init__(self, *, token_categories: Set['TokenCategory']):
+         """
+         Create a new KernTokenizer.
+
+         Args:
+             token_categories (Set[TokenCategory]): Set of categories to be tokenized. If None, an exception will be raised.
+         """
+         super().__init__(token_categories=token_categories)
+
+     def tokenize(self, token: Token) -> str:
+         """
+         Tokenize a token into a normalized kern string representation.
+         This format is the classic Humdrum **kern representation.
+
+         Args:
+             token (Token): Token to be tokenized.
+
+         Returns (str): Normalized kern string representation, i.e. the classic Humdrum **kern encoding.
+
+         Examples:
+             >>> token.encoding
+             '2@.@bb@-·_·L'
+             >>> KernTokenizer().tokenize(token)
+             '2.bb-_L'
+         """
+         return EkernTokenizer(token_categories=self.token_categories).tokenize(token).replace(TOKEN_SEPARATOR, '').replace(DECORATION_SEPARATOR, '')
+
+
+ class EkernTokenizer(Tokenizer):
+     """
+     EkernTokenizer converts a Token into an eKern (Extended **kern) string representation. This format uses a '@' separator for the \
+     main tokens and a '·' separator for the decoration tokens.
+     """
+
+     def __init__(self, *, token_categories: Set['TokenCategory']):
+         """
+         Create a new EkernTokenizer.
+
+         Args:
+             token_categories (Set[TokenCategory]): Set of categories to be tokenized. If None, an exception will be raised.
+         """
+         super().__init__(token_categories=token_categories)
+
+     def tokenize(self, token: Token) -> str:
+         """
+         Tokenize a token into an eKern string representation.
+         Args:
+             token (Token): Token to be tokenized.
+
+         Returns (str): eKern string representation.
+
+         Examples:
+             >>> token.encoding
+             '2@.@bb@-·_·L'
+             >>> EkernTokenizer().tokenize(token)
+             '2@.@bb@-·_·L'
+
+         """
+         return token.export(filter_categories=lambda cat: cat in self.token_categories)
+
+
+ class BekernTokenizer(Tokenizer):
+     """
+     BekernTokenizer converts a Token into a bekern (Basic Extended **kern) string representation. This format uses a '@' separator for the \
+     main tokens but discards all the decoration tokens.
+     """
+
+     def __init__(self, *, token_categories: Set['TokenCategory']):
+         """
+         Create a new BekernTokenizer.
+
+         Args:
+             token_categories (Set[TokenCategory]): Set of categories to be tokenized. If None, an exception will be raised.
+         """
+         super().__init__(token_categories=token_categories)
+
+     def tokenize(self, token: Token) -> str:
+         """
+         Tokenize a token into a bekern string representation.
+         Args:
+             token (Token): Token to be tokenized.
+
+         Returns (str): bekern string representation.
+
+         Examples:
+             >>> token.encoding
+             '2@.@bb@-·_·L'
+             >>> BekernTokenizer().tokenize(token)
+             '2@.@bb@-'
+         """
+         ekern_content = token.export(filter_categories=lambda cat: cat in self.token_categories)
+
+         if DECORATION_SEPARATOR not in ekern_content:
+             return ekern_content
+
+         reduced_content = ekern_content.split(DECORATION_SEPARATOR)[0]
+         if reduced_content.endswith(TOKEN_SEPARATOR):
+             reduced_content = reduced_content[:-1]
+
+         return reduced_content
+
+
+ class BkernTokenizer(Tokenizer):
+     """
+     BkernTokenizer converts a Token into a bkern (Basic **kern) string representation. This format keeps \
+     the main tokens but discards the decoration tokens. This format is a lightweight version of the classic
+     Humdrum **kern format.
+     """
+
+     def __init__(self, *, token_categories: Set['TokenCategory']):
+         """
+         Create a new BkernTokenizer.
+
+         Args:
+             token_categories (Set[TokenCategory]): Set of categories to be tokenized. If None, an exception will be raised.
+         """
+         super().__init__(token_categories=token_categories)
+
+
+     def tokenize(self, token: Token) -> str:
+         """
+         Tokenize a token into a bkern string representation.
+         Args:
+             token (Token): Token to be tokenized.
+
+         Returns (str): bkern string representation.
+
+         Examples:
+             >>> token.encoding
+             '2@.@bb@-·_·L'
+             >>> BkernTokenizer().tokenize(token)
+             '2.bb-'
+         """
+         return BekernTokenizer(token_categories=self.token_categories).tokenize(token).replace(TOKEN_SEPARATOR, '')
+
+
+ class TokenizerFactory:
+     @classmethod
+     def create(cls, type: str, *, token_categories: List['TokenCategory']) -> Tokenizer:
+         if type is None:
+             raise ValueError('A tokenization type must be provided. Found None.')
+
+         if type == Encoding.normalizedKern.value:
+             return KernTokenizer(token_categories=token_categories)
+         elif type == Encoding.eKern.value:
+             return EkernTokenizer(token_categories=token_categories)
+         elif type == Encoding.bKern.value:
+             return BkernTokenizer(token_categories=token_categories)
+         elif type == Encoding.bEkern.value:
+             return BekernTokenizer(token_categories=token_categories)
+
+         raise ValueError(f"Unknown kern type: {type}. "
+                          f"Supported types are: "
+                          f"{'-'.join([kern_type.name for kern_type in Encoding.__members__.values()])}")