phoonnx 0.2.6a2__tar.gz → 0.2.7a1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/PKG-INFO +1 -1
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/version.py +2 -2
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx.egg-info/PKG-INFO +1 -1
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/preprocess.py +23 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/README.md +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/config.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/locale/ca/phonetic_spellings.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/locale/en/phonetic_spellings.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/locale/gl/phonetic_spellings.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/locale/pt/phonetic_spellings.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phoneme_ids.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/ar.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/base.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/en.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/fa.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/gl.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/he.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/ja.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/ko.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/mul.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/mwl.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/vi.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/phonemizers/zh.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/arpa2ipa.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/bw2ipa.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/cotovia/cotovia_aarch64 +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/cotovia/cotovia_x86_64 +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/hangul2ipa.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/aspiration.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/assimilation.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/double_coda.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/hanja.tsv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/ipa.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/neutralization.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/tensification.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/ko_tables/yale.csv +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/kog2p/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/kog2p/rulebook.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/buck/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/buck/phonetise_buckwalter.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/buck/symbols.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/buck/tokenization.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/num2words.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/arabrepr.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/araby.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/named_const.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/normalize.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/number.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/number_const.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/stack.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/pyarabic/trans.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/mantoq/unicode_symbol2label.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/phonikud/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/LICENSE +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/SOURCE +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/hint_id_map.json +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/input_id_map.json +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/model.onnx +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/tashkeel/target_id_map.json +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/thirdparty/zh_num.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/util.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx/voice.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx.egg-info/SOURCES.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx.egg-info/dependency_links.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx.egg-info/requires.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx.egg-info/top_level.txt +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/export_onnx.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/norm_audio/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/norm_audio/trim.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/norm_audio/vad.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/train.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/attentions.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/commons.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/config.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/dataset.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/lightning.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/losses.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/mel_processing.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/models.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/modules.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/monotonic_align/__init__.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/monotonic_align/setup.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/transforms.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/utils.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/phoonnx_train/vits/wavfile.py +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/setup.cfg +0 -0
- {phoonnx-0.2.6a2 → phoonnx-0.2.7a1}/setup.py +0 -0
@@ -377,6 +377,16 @@ def phonemize_worker(
|
|
377
377
|
is_flag=True,
|
378
378
|
help="Add diacritics to text (phonemizer specific, e.g., to denote stress).",
|
379
379
|
)
|
380
|
+
@click.option(
|
381
|
+
"--jsonl-audio-path",
|
382
|
+
default=None,
|
383
|
+
help="override audio_path base directory (everything before '/wav') in generated dataset.jsonl"
|
384
|
+
)
|
385
|
+
@click.option(
|
386
|
+
"--jsonl-audio-spec-path",
|
387
|
+
default=None,
|
388
|
+
help="override audio_norm_path/audio_spec_path base directory (everything before '/cache') in generated dataset.jsonl"
|
389
|
+
)
|
380
390
|
def cli(
|
381
391
|
input_dir: Path,
|
382
392
|
output_dir: Path,
|
@@ -397,6 +407,8 @@ def cli(
|
|
397
407
|
skip_audio: bool,
|
398
408
|
debug: bool,
|
399
409
|
add_diacritics: bool,
|
410
|
+
jsonl_audio_path: Optional[str],
|
411
|
+
jsonl_audio_spec_path: Optional[str],
|
400
412
|
) -> None:
|
401
413
|
"""
|
402
414
|
Preprocess a TTS dataset (e.g., LJSpeech format) for training a VITS-style model.
|
@@ -609,6 +621,17 @@ def cli(
|
|
609
621
|
_LOGGER.warning("Skipping utterance with invalid phoneme_ids before writing: %s", utt.audio_path)
|
610
622
|
continue
|
611
623
|
|
624
|
+
# apply path overrides if needed
|
625
|
+
# this allows pre-processing the dataset on one system and then training on another
|
626
|
+
if jsonl_audio_path:
|
627
|
+
base_path, fname = str(utt.audio_path).split("/wav/")
|
628
|
+
utt.audio_path = Path(f"{jsonl_audio_path}/wav/{fname}")
|
629
|
+
if jsonl_audio_spec_path:
|
630
|
+
base_path, fname = str(utt.audio_norm_path).split("/cache/")
|
631
|
+
utt.audio_norm_path = Path(f"{jsonl_audio_spec_path}/cache/{fname}")
|
632
|
+
base_path, fname = str(utt.audio_spec_path).split("/cache/")
|
633
|
+
utt.audio_spec_path = Path(f"{jsonl_audio_spec_path}/cache/{fname}")
|
634
|
+
|
612
635
|
json.dump(
|
613
636
|
utt.asdict(),
|
614
637
|
dataset_file,
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|