phoonnx 0.1.0a3__tar.gz → 0.1.1a1__tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (94)
  1. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/PKG-INFO +2 -1
  2. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/README.md +1 -0
  3. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/config.py +7 -0
  4. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/__init__.py +4 -1
  5. phoonnx-0.1.1a1/phoonnx/phonemizers/mwl.py +36 -0
  6. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/version.py +3 -3
  7. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx.egg-info/PKG-INFO +2 -1
  8. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx.egg-info/SOURCES.txt +2 -0
  9. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx.egg-info/requires.txt +3 -0
  10. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/__init__.py +0 -0
  11. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/locale/ca/phonetic_spellings.txt +0 -0
  12. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/locale/en/phonetic_spellings.txt +0 -0
  13. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/locale/gl/phonetic_spellings.txt +0 -0
  14. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/locale/pt/phonetic_spellings.txt +0 -0
  15. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phoneme_ids.py +0 -0
  16. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/ar.py +0 -0
  17. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/base.py +0 -0
  18. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/en.py +0 -0
  19. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/fa.py +0 -0
  20. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/gl.py +0 -0
  21. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/he.py +0 -0
  22. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/ja.py +0 -0
  23. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/ko.py +0 -0
  24. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/mul.py +0 -0
  25. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/vi.py +0 -0
  26. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/phonemizers/zh.py +0 -0
  27. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/__init__.py +0 -0
  28. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/arpa2ipa.py +0 -0
  29. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/bw2ipa.py +0 -0
  30. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/cotovia/cotovia_aarch64 +0 -0
  31. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/cotovia/cotovia_x86_64 +0 -0
  32. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/hangul2ipa.py +0 -0
  33. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/aspiration.csv +0 -0
  34. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/assimilation.csv +0 -0
  35. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/double_coda.csv +0 -0
  36. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/hanja.tsv +0 -0
  37. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/ipa.csv +0 -0
  38. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/neutralization.csv +0 -0
  39. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/tensification.csv +0 -0
  40. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/ko_tables/yale.csv +0 -0
  41. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/kog2p/__init__.py +0 -0
  42. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/kog2p/rulebook.txt +0 -0
  43. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/__init__.py +0 -0
  44. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/buck/__init__.py +0 -0
  45. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/buck/phonetise_buckwalter.py +0 -0
  46. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/buck/symbols.py +0 -0
  47. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/buck/tokenization.py +0 -0
  48. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/num2words.py +0 -0
  49. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/__init__.py +0 -0
  50. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/arabrepr.py +0 -0
  51. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/araby.py +0 -0
  52. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/named_const.py +0 -0
  53. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/normalize.py +0 -0
  54. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/number.py +0 -0
  55. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/number_const.py +0 -0
  56. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/stack.py +0 -0
  57. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/pyarabic/trans.py +0 -0
  58. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/mantoq/unicode_symbol2label.py +0 -0
  59. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/phonikud/__init__.py +0 -0
  60. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/LICENSE +0 -0
  61. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/SOURCE +0 -0
  62. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/__init__.py +0 -0
  63. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/hint_id_map.json +0 -0
  64. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/input_id_map.json +0 -0
  65. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/model.onnx +0 -0
  66. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/tashkeel/target_id_map.json +0 -0
  67. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/thirdparty/zh_num.py +0 -0
  68. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/util.py +0 -0
  69. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx/voice.py +0 -0
  70. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx.egg-info/dependency_links.txt +0 -0
  71. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx.egg-info/top_level.txt +0 -0
  72. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/__main__.py +0 -0
  73. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/export_onnx.py +0 -0
  74. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/norm_audio/__init__.py +0 -0
  75. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/norm_audio/trim.py +0 -0
  76. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/norm_audio/vad.py +0 -0
  77. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/preprocess.py +0 -0
  78. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/__init__.py +0 -0
  79. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/attentions.py +0 -0
  80. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/commons.py +0 -0
  81. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/config.py +0 -0
  82. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/dataset.py +0 -0
  83. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/lightning.py +0 -0
  84. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/losses.py +0 -0
  85. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/mel_processing.py +0 -0
  86. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/models.py +0 -0
  87. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/modules.py +0 -0
  88. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/monotonic_align/__init__.py +0 -0
  89. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/monotonic_align/setup.py +0 -0
  90. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/transforms.py +0 -0
  91. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/utils.py +0 -0
  92. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/phoonnx_train/vits/wavfile.py +0 -0
  93. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/setup.cfg +0 -0
  94. {phoonnx-0.1.0a3 → phoonnx-0.1.1a1}/setup.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: phoonnx
3
- Version: 0.1.0a3
3
+ Version: 0.1.1a1
4
4
  Home-page: https://github.com/TigreGotico/phoonnx
5
5
  Author: JarbasAi
6
6
  Author-email: jarbasai@mailfence.com
@@ -41,6 +41,7 @@ Provides-Extra: jam
41
41
  Provides-Extra: hsn
42
42
  Provides-Extra: fil
43
43
  Provides-Extra: ml
44
+ Provides-Extra: mwl
44
45
  Provides-Extra: lez
45
46
  Provides-Extra: si
46
47
  Provides-Extra: kk
@@ -89,6 +89,7 @@ wrap, and the output alphabets they can generate.
89
89
  | **Multilingual** | `MisakiPhonemizer` | [misaki](https://github.com/hexgrad/misaki) | IPA | Misaki is a G2P engine designed for Kokoro models. |
90
90
  | **Multilingual** | `TransphonePhonemizer` | [transphone](https://github.com/xinjli/transphone) | IPA | It provides approximated phoneme tokenizers and G2P model for 7546 languages registered in the Glottolog database. |
91
91
  | **Multilingual** | `EpitranPhonemizer` | [epitran](https://github.com/dmort27/epitran) | IPA | A tool for transcribing orthographic text as IPA |
92
+ | **Mirandese (mwl)** | `MirandesePhonemizer` | [mwl_phonemizer](https://github.com/TigreGotico/mwl_phonemizer) | IPA | A tool for transcribing orthographic text as IPA |
92
93
  | **Arabic (ar)** | `MantoqPhonemizer` | [mantoq](https://github.com/mush42/mantoq) | BUCKWALTER, IPA | Translates unvoweled Arabic to phonemes, with optional conversion to IPA. |
93
94
  | **Chinese (zh)** | `JiebaPhonemizer` | [jieba](https://github.com/fxsjy/jieba) | HANZI | Segments Chinese text into words with spaces; useful for pre-processing. |
94
95
  | **Chinese (zh)** | `G2pMPhonemizer` | [g2pC](https://github.com/Kyubyong/g2pC) | IPA, Pinyin | CRF-based Grapheme-to-Phoneme converter |
@@ -48,6 +48,8 @@ class PhonemeType(str, Enum):
48
48
  EPITRAN = "epitran"
49
49
  BYT5 = "byt5"
50
50
  CHARSIU = "charsiu" # technically same as byt5, but needs special handling for whitespace
51
+ TRANSPHONE = "transphone"
52
+ MIRANDESE = "mwl_phonemizer"
51
53
 
52
54
  DEEPPHONEMIZER = "deepphonemizer" # en
53
55
  OPENPHONEMIZER = "openphonemizer" # en
@@ -392,6 +394,7 @@ def get_phonemizer(phoneme_type: PhonemeType,
392
394
  from phoonnx.phonemizers import (EpitranPhonemizer, EspeakPhonemizer, OpenPhonemizer, OpenJTaklPhonemizer,
393
395
  ByT5Phonemizer, CharsiuPhonemizer, DeepPhonemizer, PersianPhonemizer,
394
396
  G2pCPhonemizer, G2pMPhonemizer, G2PKPhonemizer, G2PEnPhonemizer,
397
+ TransphonePhonemizer, MirandesePhonemizer,
395
398
  GruutPhonemizer, GraphemePhonemizer, MantoqPhonemizer, MisakiPhonemizer,
396
399
  KoG2PPhonemizer, PypinyinPhonemizer, PyKakasiPhonemizer, CotoviaPhonemizer,
397
400
  CutletPhonemizer, PhonikudPhonemizer, VIPhonemePhonemizer, XpinyinPhonemizer,
@@ -408,6 +411,10 @@ def get_phonemizer(phoneme_type: PhonemeType,
408
411
  phonemizer = EpitranPhonemizer()
409
412
  elif phoneme_type == PhonemeType.MISAKI:
410
413
  phonemizer = MisakiPhonemizer()
414
+ elif phoneme_type == PhonemeType.TRANSPHONE:
415
+ phonemizer = TransphonePhonemizer()
416
+ elif phoneme_type == PhonemeType.MIRANDESE:
417
+ phonemizer = MirandesePhonemizer()
411
418
  elif phoneme_type == PhonemeType.DEEPPHONEMIZER:
412
419
  phonemizer = DeepPhonemizer(model)
413
420
  elif phoneme_type == PhonemeType.OPENPHONEMIZER:
@@ -12,7 +12,8 @@ from phoonnx.phonemizers.ko import KoG2PPhonemizer, G2PKPhonemizer
12
12
  from phoonnx.phonemizers.zh import (G2pCPhonemizer, G2pMPhonemizer, PypinyinPhonemizer,
13
13
  XpinyinPhonemizer, JiebaPhonemizer)
14
14
  from phoonnx.phonemizers.mul import (EspeakPhonemizer, EpitranPhonemizer, MisakiPhonemizer,
15
- GruutPhonemizer, ByT5Phonemizer, CharsiuPhonemizer)
15
+ GruutPhonemizer, ByT5Phonemizer, CharsiuPhonemizer, TransphonePhonemizer)
16
+ from phoonnx.phonemizers.mwl import MirandesePhonemizer
16
17
 
17
18
  Phonemizer = Union[
18
19
  MisakiPhonemizer,
@@ -22,6 +23,8 @@ Phonemizer = Union[
22
23
  EspeakPhonemizer,
23
24
  GruutPhonemizer,
24
25
  EpitranPhonemizer,
26
+ TransphonePhonemizer,
27
+ MirandesePhonemizer,
25
28
  OpenJTaklPhonemizer,
26
29
  CutletPhonemizer,
27
30
  PyKakasiPhonemizer,
@@ -0,0 +1,36 @@
1
+ from phoonnx.phonemizers.base import BasePhonemizer, Alphabet
2
+ from mwl_phonemizer import CRFOrthoCorrector
3
+
4
+
5
+ class MirandesePhonemizer(BasePhonemizer):
6
+ _LANGS = ["mwl"]
7
+
8
+ def __init__(self):
9
+ super().__init__(Alphabet.IPA)
10
+ self.pho = CRFOrthoCorrector()
11
+
12
+ @classmethod
13
+ def get_lang(cls, target_lang: str) -> str:
14
+ """
15
+ Validates and returns the closest supported language code.
16
+
17
+ Args:
18
+ target_lang (str): The language code to validate.
19
+
20
+ Returns:
21
+ str: The validated language code.
22
+
23
+ Raises:
24
+ ValueError: If the language code is unsupported.
25
+ """
26
+ return cls.match_lang(target_lang, cls._LANGS)
27
+
28
+ def phonemize_string(self, text: str, lang: str) -> str:
29
+ # Validate language is supported
30
+ lang = self.get_lang(lang)
31
+ return self.pho.phonemize_sentence(text)
32
+
33
+
34
+ if __name__ == "__main__":
35
+ pho = MirandesePhonemizer()
36
+ print(pho.phonemize_string("ls", "mwl"))
@@ -1,10 +1,10 @@
1
1
  # START_VERSION_BLOCK
2
2
  VERSION_MAJOR = 0
3
3
  VERSION_MINOR = 1
4
- VERSION_BUILD = 0
5
- VERSION_ALPHA = 3
4
+ VERSION_BUILD = 1
5
+ VERSION_ALPHA = 1
6
6
  # END_VERSION_BLOCK
7
7
 
8
8
  VERSION_STR = f"{VERSION_MAJOR}.{VERSION_MINOR}.{VERSION_BUILD}"
9
9
  if VERSION_ALPHA:
10
- VERSION_STR += f"a{VERSION_ALPHA}"
10
+ VERSION_STR += f"a{VERSION_ALPHA}"
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: phoonnx
3
- Version: 0.1.0a3
3
+ Version: 0.1.1a1
4
4
  Home-page: https://github.com/TigreGotico/phoonnx
5
5
  Author: JarbasAi
6
6
  Author-email: jarbasai@mailfence.com
@@ -41,6 +41,7 @@ Provides-Extra: jam
41
41
  Provides-Extra: hsn
42
42
  Provides-Extra: fil
43
43
  Provides-Extra: ml
44
+ Provides-Extra: mwl
44
45
  Provides-Extra: lez
45
46
  Provides-Extra: si
46
47
  Provides-Extra: kk
@@ -25,6 +25,7 @@ phoonnx/phonemizers/he.py
25
25
  phoonnx/phonemizers/ja.py
26
26
  phoonnx/phonemizers/ko.py
27
27
  phoonnx/phonemizers/mul.py
28
+ phoonnx/phonemizers/mwl.py
28
29
  phoonnx/phonemizers/vi.py
29
30
  phoonnx/phonemizers/zh.py
30
31
  phoonnx/thirdparty/__init__.py
@@ -91,6 +92,7 @@ phoonnx_train/../phoonnx/phonemizers/he.py
91
92
  phoonnx_train/../phoonnx/phonemizers/ja.py
92
93
  phoonnx_train/../phoonnx/phonemizers/ko.py
93
94
  phoonnx_train/../phoonnx/phonemizers/mul.py
95
+ phoonnx_train/../phoonnx/phonemizers/mwl.py
94
96
  phoonnx_train/../phoonnx/phonemizers/vi.py
95
97
  phoonnx_train/../phoonnx/phonemizers/zh.py
96
98
  phoonnx_train/../phoonnx/thirdparty/__init__.py
@@ -206,6 +206,9 @@ epitran
206
206
  [mt]
207
207
  epitran
208
208
 
209
+ [mwl]
210
+ mwl_phonemizer
211
+
209
212
  [my]
210
213
  epitran
211
214
 
File without changes
File without changes
File without changes
File without changes
File without changes