phoonnx 0.2.4a1__py3-none-any.whl → 0.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
phoonnx/version.py CHANGED
@@ -1,8 +1,8 @@
1
1
  # START_VERSION_BLOCK
2
2
  VERSION_MAJOR = 0
3
3
  VERSION_MINOR = 2
4
- VERSION_BUILD = 4
5
- VERSION_ALPHA = 1
4
+ VERSION_BUILD = 6
5
+ VERSION_ALPHA = 0
6
6
  # END_VERSION_BLOCK
7
7
 
8
8
  VERSION_STR = f"{VERSION_MAJOR}.{VERSION_MINOR}.{VERSION_BUILD}"
phoonnx/voice.py CHANGED
@@ -203,7 +203,6 @@ class TTSVoice:
203
203
  phonemes = self.phonemizer.phonemize(
204
204
  text_part, self.config.lang_code
205
205
  )
206
- phonemes.extend(phonemes)
207
206
 
208
207
  if phonemes and (not phonemes[-1]):
209
208
  # Remove empty phonemes
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: phoonnx
3
- Version: 0.2.4a1
3
+ Version: 0.2.6
4
4
  Home-page: https://github.com/TigreGotico/phoonnx
5
5
  Author: JarbasAi
6
6
  Author-email: jarbasai@mailfence.com
@@ -2,8 +2,8 @@ phoonnx/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
2
2
  phoonnx/config.py,sha256=DKgsU03g8jrAuMcVqbu-w3MWPXOUihFtRnavg6WGQ1Y,19983
3
3
  phoonnx/phoneme_ids.py,sha256=FiNgZwV6naEsBh6XwFLh3_FyOgPiCsK9qo7S0v-CmI4,13667
4
4
  phoonnx/util.py,sha256=XSjFEoqSFcujFTHxednacgC9GrSYyF-Il5L6Utmxmu4,25909
5
- phoonnx/version.py,sha256=VZdcd-pCi-vCStncJnB1n_gha4f3TNjR-W_dSyoACOw,237
6
- phoonnx/voice.py,sha256=JXjmbrhJd4mmTiLgz4O_Pa5_rKGUC9xzuBfqxYDw3Mg,19420
5
+ phoonnx/version.py,sha256=Ed7aHpgOwiCu6_EBeRxVmQI4Pm7CgBOFmHep_sKNUO0,237
6
+ phoonnx/voice.py,sha256=Fh60o87-_sIw4zTP8NEGvEV7XzTC0FhW9Jkq7Fr60lQ,19382
7
7
  phoonnx/locale/ca/phonetic_spellings.txt,sha256=igv3t7jxLSRE5GHsdn57HOpxiWNcEmECPql6m02wbO0,47
8
8
  phoonnx/locale/en/phonetic_spellings.txt,sha256=xGQlWOABLzbttpQvopl9CU-NnwEJRqKx8iuylsdUoQA,27
9
9
  phoonnx/locale/gl/phonetic_spellings.txt,sha256=igv3t7jxLSRE5GHsdn57HOpxiWNcEmECPql6m02wbO0,47
@@ -62,8 +62,8 @@ phoonnx/thirdparty/tashkeel/hint_id_map.json,sha256=gJMdtTsfEDFgmmbyO2Shw315rkqK
62
62
  phoonnx/thirdparty/tashkeel/input_id_map.json,sha256=cnpJqjx-k53AbzKyfC4GxMS771ltzkv1EnYmHKc2w8M,628
63
63
  phoonnx/thirdparty/tashkeel/model.onnx,sha256=UsQNQsoJT_n_B6CR0KHq_XuqXPI4jmCpzIm6zY5elV8,4788213
64
64
  phoonnx/thirdparty/tashkeel/target_id_map.json,sha256=baNAJL_UwP9U91mLt01aAEBRRNdGr-csFB_O6roh7TA,181
65
- phoonnx_train/export_onnx.py,sha256=CPfgNEm0hnXPSlgme0R9jr-6jZ5fKFpG5DZJFMkC-h4,12820
66
- phoonnx_train/preprocess.py,sha256=T1YcM89bizARKMaqjDtr3JzidoNvAbm-3n3eClbzMsI,21880
65
+ phoonnx_train/export_onnx.py,sha256=UFn1id5-p9tIXxK9FvHOry59WkotNqXtupinkeKcSDs,12881
66
+ phoonnx_train/preprocess.py,sha256=VYyU8XaCroa6tnLhQkQJ8wq1w1Gf9PPnIIM1N0PIcNE,22042
67
67
  phoonnx_train/train.py,sha256=nsINvDQ3dYvBne5UWPgLZ0a4qZFdSsOKk8HzZHGTLY4,8757
68
68
  phoonnx_train/norm_audio/__init__.py,sha256=Al_YwqMnENXRWp0c79cDZqbdd7pFYARXKxCfBaedr1c,3030
69
69
  phoonnx_train/norm_audio/trim.py,sha256=_ZsE3SYhahQSdEdBLeSwyFJGcvEbt-5E_lnWwTT4tcY,1698
@@ -83,7 +83,7 @@ phoonnx_train/vits/utils.py,sha256=exiyrtPHbnnGvcHWSbaH9-gR6srH5ZPHlKiqV2IHUrQ,4
83
83
  phoonnx_train/vits/wavfile.py,sha256=oQZiTIrdw0oLTbcVwKfGXye1WtKte6qK_52qVwiMvfc,26396
84
84
  phoonnx_train/vits/monotonic_align/__init__.py,sha256=5IdAOD1Z7UloMb6d_9NRFsXoNIjEQ3h9mvOSh_AtO3k,636
85
85
  phoonnx_train/vits/monotonic_align/setup.py,sha256=0K5iJJ2mKIklx6ncEfCQS34skm5hHPiz9vRlQEvevvY,266
86
- phoonnx-0.2.4a1.dist-info/METADATA,sha256=p_Hn1MLi2aPfctGgz_APHUmfwxl8nBkjozwqdxbU4b4,8250
87
- phoonnx-0.2.4a1.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
88
- phoonnx-0.2.4a1.dist-info/top_level.txt,sha256=ZrnHXe-4HqbOSX6fbdY-JiP7YEu2Bok9T0ji351MrmM,22
89
- phoonnx-0.2.4a1.dist-info/RECORD,,
86
+ phoonnx-0.2.6.dist-info/METADATA,sha256=Lg0o0_aPp_pb-Dhvcx3IMgw5LiDHWwbfyXIKF8blFWE,8248
87
+ phoonnx-0.2.6.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
88
+ phoonnx-0.2.6.dist-info/top_level.txt,sha256=ZrnHXe-4HqbOSX6fbdY-JiP7YEu2Bok9T0ji351MrmM,22
89
+ phoonnx-0.2.6.dist-info/RECORD,,
@@ -113,7 +113,8 @@ def convert_to_piper(config_path: Path, output_path: Path = Path("piper.json"))
113
113
  "phoneme_map": {},
114
114
  "audio": config.get("audio", {}),
115
115
  "inference": config.get("inference", {}),
116
- "phoneme_id_map": {k: [v] for k, v in config.get("phoneme_id_map", {}).items()},
116
+ "phoneme_id_map": {k: [v] if not isinstance(v, list) else v
117
+ for k, v in config.get("phoneme_id_map", {}).items()},
117
118
  "espeak": {
118
119
  "voice": config.get("lang_code", "")
119
120
  },
@@ -518,7 +518,10 @@ def cli(
518
518
  if prev_config:
519
519
  with open(prev_config) as f:
520
520
  cfg = json.load(f)
521
- prev_phoneme_id_map = cfg["phoneme_id_map"]
521
+ # flatten list, some models (e.g. piper) use a list of ids
522
+ prev_phoneme_id_map = {k: v if not isinstance(v, list) else v[0]
523
+ for k, v in cfg["phoneme_id_map"].items()}
524
+
522
525
  prev_num_symbols = cfg.get("num_symbols", MAX_PHONEMES)
523
526
  _LOGGER.info(f"Loaded phoneme map from previous config: '{prev_config}'")
524
527
  all_phonemes.update(prev_phoneme_id_map.keys())