Audyn 0.0.1.dev1__tar.gz → 0.0.1.dev7__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/Audyn.egg-info/PKG-INFO +43 -1
- audyn-0.0.1.dev7/Audyn.egg-info/SOURCES.txt +193 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/Audyn.egg-info/requires.txt +12 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/MANIFEST.in +2 -1
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/PKG-INFO +43 -1
- audyn-0.0.1.dev7/README.md +64 -0
- audyn-0.0.1.dev7/audyn/__init__.py +61 -0
- audyn-0.0.1.dev7/audyn/criterion/__init__.py +6 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/base.py +5 -5
- audyn-0.0.1.dev7/audyn/criterion/contrastive.py +698 -0
- audyn-0.0.1.dev7/audyn/criterion/distance.py +123 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/flow.py +37 -4
- audyn-0.0.1.dev7/audyn/criterion/gan.py +49 -0
- audyn-0.0.1.dev7/audyn/criterion/glowtts.py +96 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/hifigan.py +20 -1
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/melspectrogram.py +13 -1
- audyn-0.0.1.dev7/audyn/criterion/rvqvae.py +91 -0
- audyn-0.0.1.dev7/audyn/criterion/ssast.py +108 -0
- audyn-0.0.1.dev7/audyn/criterion/vqvae.py +95 -0
- audyn-0.0.1.dev7/audyn/functional/__init__.py +3 -0
- audyn-0.0.1.dev7/audyn/functional/activation.py +119 -0
- audyn-0.0.1.dev7/audyn/functional/clustering.py +237 -0
- audyn-0.0.1.dev7/audyn/functional/vector_quantization.py +97 -0
- audyn-0.0.1.dev7/audyn/metrics/__init__.py +62 -0
- audyn-0.0.1.dev7/audyn/metrics/base.py +98 -0
- audyn-0.0.1.dev7/audyn/metrics/crossmodal.py +191 -0
- audyn-0.0.1.dev7/audyn/metrics/retrieval.py +182 -0
- audyn-0.0.1.dev7/audyn/models/__init__.py +53 -0
- audyn-0.0.1.dev7/audyn/models/ast.py +686 -0
- audyn-0.0.1.dev7/audyn/models/encodec.py +470 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/fastspeech.py +236 -88
- audyn-0.0.1.dev7/audyn/models/glowtts.py +1111 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/hifigan.py +10 -0
- audyn-0.0.1.dev7/audyn/models/lextransformer.py +449 -0
- audyn-0.0.1.dev7/audyn/models/passt.py +237 -0
- audyn-0.0.1.dev7/audyn/models/pixelsnail.py +203 -0
- audyn-0.0.1.dev7/audyn/models/roformer.py +468 -0
- audyn-0.0.1.dev7/audyn/models/rvqvae.py +235 -0
- audyn-0.0.1.dev7/audyn/models/soundstream.py +737 -0
- audyn-0.0.1.dev7/audyn/models/ssast.py +1008 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/text_to_wave.py +57 -50
- audyn-0.0.1.dev7/audyn/models/vae.py +24 -0
- audyn-0.0.1.dev7/audyn/models/vqvae.py +183 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/waveglow.py +63 -52
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/wavenet.py +63 -36
- audyn-0.0.1.dev7/audyn/modules/activation.py +1166 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/duration_predictor.py +40 -10
- audyn-0.0.1.dev7/audyn/modules/encodec.py +329 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/fastspeech.py +4 -12
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/flow.py +4 -6
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/glow.py +133 -27
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/glowtts.py +363 -47
- audyn-0.0.1.dev7/audyn/modules/passt.py +574 -0
- audyn-0.0.1.dev7/audyn/modules/pixelcnn.py +319 -0
- audyn-0.0.1.dev7/audyn/modules/pixelsnail.py +545 -0
- audyn-0.0.1.dev7/audyn/modules/positional_encoding.py +219 -0
- audyn-0.0.1.dev7/audyn/modules/rvq.py +156 -0
- audyn-0.0.1.dev7/audyn/modules/soundstream.py +307 -0
- audyn-0.0.1.dev7/audyn/modules/vit.py +468 -0
- audyn-0.0.1.dev7/audyn/modules/vq.py +245 -0
- audyn-0.0.1.dev7/audyn/modules/vqvae.py +5 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/waveglow.py +28 -28
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/wavenet.py +34 -34
- audyn-0.0.1.dev7/audyn/optim/lr_scheduler.py +211 -0
- audyn-0.0.1.dev7/audyn/optim/optimizer.py +1447 -0
- audyn-0.0.1.dev7/audyn/transforms/__init__.py +23 -0
- audyn-0.0.1.dev7/audyn/transforms/ast.py +185 -0
- audyn-0.0.1.dev7/audyn/transforms/birdclef.py +168 -0
- audyn-0.0.1.dev7/audyn/transforms/cqt.py +705 -0
- audyn-0.0.1.dev7/audyn/transforms/hifigan.py +95 -0
- audyn-0.0.1.dev7/audyn/transforms/hubert.py +59 -0
- audyn-0.0.1.dev7/audyn/transforms/kaldi.py +461 -0
- audyn-0.0.1.dev7/audyn/transforms/librosa.py +83 -0
- audyn-0.0.1.dev7/audyn/utils/__init__.py +628 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/alignment/__init__.py +10 -3
- audyn-0.0.1.dev7/audyn/utils/alignment/monotonic_align.py +66 -0
- audyn-0.0.1.dev7/audyn/utils/clip_grad.py +171 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/data/__init__.py +13 -51
- audyn-0.0.1.dev7/audyn/utils/data/audioset/__init__.py +9 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/_download.py +53 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/ast.py +7 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/composer.py +190 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/dataset.py +516 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/distributed.py +105 -0
- audyn-0.0.1.dev7/audyn/utils/data/audioset/sampler.py +102 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/_common/__init__.py +81 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2022/__init__.py +67 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2022/_download.py +36 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/__init__.py +122 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/_download.py +36 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/collator.py +54 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/composer.py +292 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/dataset.py +217 -0
- audyn-0.0.1.dev7/audyn/utils/data/birdclef/birdclef2024/models/baseline.py +65 -0
- audyn-0.0.1.dev7/audyn/utils/data/clotho/__init__.py +37 -0
- audyn-0.0.1.dev7/audyn/utils/data/clotho/text/indexing.py +113 -0
- audyn-0.0.1.dev7/audyn/utils/data/clotho/text/normalization.py +27 -0
- audyn-0.0.1.dev7/audyn/utils/data/clotho/text/symbols.py +9 -0
- audyn-0.0.1.dev7/audyn/utils/data/clotho/text/tokenization.py +25 -0
- audyn-0.0.1.dev7/audyn/utils/data/cmudict/__init__.py +223 -0
- audyn-0.0.1.dev7/audyn/utils/data/cmudict/indexing.py +39 -0
- audyn-0.0.1.dev7/audyn/utils/data/collator.py +126 -0
- audyn-0.0.1.dev7/audyn/utils/data/composer.py +135 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/data/dataloader.py +72 -40
- audyn-0.0.1.dev7/audyn/utils/data/dataset.py +196 -0
- audyn-0.0.1.dev7/audyn/utils/data/postprocess.py +320 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/data/sampler.py +4 -1
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/__init__.py +30 -0
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/text/indexing.py +33 -0
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/text/normalization.py +118 -0
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/text/numbers.py +83 -0
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/text/symbols.py +90 -0
- audyn-0.0.1.dev7/audyn/utils/data/tacotron/text/tokenization.py +26 -0
- audyn-0.0.1.dev7/audyn/utils/data/webdataset.py +72 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/distributed/__init__.py +8 -1
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/driver/__init__.py +4 -2
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/config.yaml +15 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/criterion/cross_entropy.yaml +15 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/criterion/vqvae.yaml +34 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/data/defaults.yaml +2 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/lr_scheduler/defaults.yaml +0 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/lr_scheduler/none.yaml +0 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/lr_scheduler/transformer.yaml +3 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/model/defaults.yaml +0 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/model/gan.yaml +2 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/optimizer/adam.yaml +1 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/optimizer/adam_ema.yaml +5 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/optimizer/adamw.yaml +1 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/optimizer/gan.yaml +2 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/preprocess/defaults.yaml +6 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/preprocess/ljspeech_text-to-feat.yaml +6 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/preprocess/text-to-feat.yaml +5 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/preprocess/text-to-wave.yaml +5 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/cpu.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/cuda.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/cuda_amp.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/cuda_ddp.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/cuda_ddp_amp.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/defaults.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/system/mps.yaml +11 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/test/dataloader/defaults.yaml +4 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/test/dataset/defaults.yaml +3 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/test/dataset/torch.yaml +4 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/test/defaults.yaml +28 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/test/text_to_wave.yaml +36 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/clip_gradient/defaults.yaml +0 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/clip_gradient/gan.yaml +6 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataloader/defaults.yaml +8 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataloader/sequential-batch.yaml +9 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataset/defaults.yaml +6 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataset/sortable-torch.yaml +9 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataset/torch.yaml +8 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/dataset/webdataset.yaml +8 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/defaults.yaml +35 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/gan.yaml +51 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/record/defaults.yaml +0 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/record/template.yaml +58 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/template.yaml +45 -0
- audyn-0.0.1.dev7/audyn/utils/driver/_conf_template/train/text-to-feat+pretrained_feat-to-wave.yaml +51 -0
- audyn-0.0.1.dev7/audyn/utils/driver/base.py +2585 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/driver/feat_to_wave.py +4 -1
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/driver/gan.py +357 -339
- audyn-0.0.1.dev7/audyn/utils/driver/text_to_feat.py +461 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/driver/text_to_wave.py +34 -9
- audyn-0.0.1.dev7/audyn/utils/duration/__init__.py +44 -0
- audyn-0.0.1.dev7/audyn/utils/github/__init__.py +133 -0
- audyn-0.0.1.dev7/audyn/utils/hydra/utils.py +515 -0
- audyn-0.0.1.dev7/audyn/utils/lab/__init__.py +17 -0
- audyn-0.0.1.dev7/audyn/utils/model/__init__.py +68 -0
- audyn-0.0.1.dev7/audyn/utils/music/__init__.py +66 -0
- audyn-0.0.1.dev7/audyn/utils/text/__init__.py +272 -0
- audyn-0.0.1.dev7/audyn/utils/text/indexing.py +22 -0
- audyn-0.0.1.dev7/audyn/utils/text/normalization.py +22 -0
- audyn-0.0.1.dev7/audyn/utils/text/pronunciation.py +49 -0
- audyn-0.0.1.dev7/audyn/utils/text/tokenization.py +57 -0
- audyn-0.0.1.dev7/cpp_extensions/monotonic_align/monotonic_align.cpp +96 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/pyproject.toml +18 -1
- audyn-0.0.1.dev7/setup.py +149 -0
- Audyn-0.0.1.dev1/Audyn.egg-info/SOURCES.txt +0 -65
- Audyn-0.0.1.dev1/README.md +0 -31
- Audyn-0.0.1.dev1/audyn/__init__.py +0 -19
- Audyn-0.0.1.dev1/audyn/criterion/gan.py +0 -9
- Audyn-0.0.1.dev1/audyn/models/__init__.py +0 -12
- Audyn-0.0.1.dev1/audyn/models/glowtts.py +0 -675
- Audyn-0.0.1.dev1/audyn/modules/positional_encoding.py +0 -58
- Audyn-0.0.1.dev1/audyn/optim/lr_scheduler.py +0 -38
- Audyn-0.0.1.dev1/audyn/optim/optimizer.py +0 -295
- Audyn-0.0.1.dev1/audyn/utils/__init__.py +0 -41
- Audyn-0.0.1.dev1/audyn/utils/alignment/monotonic_align.py +0 -26
- Audyn-0.0.1.dev1/audyn/utils/data/cmudict/__init__.py +0 -92
- Audyn-0.0.1.dev1/audyn/utils/data/dataset.py +0 -62
- Audyn-0.0.1.dev1/audyn/utils/data/postprocess.py +0 -231
- Audyn-0.0.1.dev1/audyn/utils/driver/base.py +0 -1568
- Audyn-0.0.1.dev1/audyn/utils/driver/text_to_feat.py +0 -31
- Audyn-0.0.1.dev1/audyn/utils/hydra/utils.py +0 -104
- Audyn-0.0.1.dev1/audyn/utils/model/__init__.py +0 -21
- Audyn-0.0.1.dev1/cpp_extensions/monotonic_align/monotonic_align.cpp +0 -108
- Audyn-0.0.1.dev1/setup.py +0 -32
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/Audyn.egg-info/dependency_links.txt +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/Audyn.egg-info/top_level.txt +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/LICENSE +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/autoregressive.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/fastspeech.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/criterion/lsgan.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/models/gan.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/film.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/modules/normalization.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/data/distributed.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/driver/_decorator.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/hydra/__init__.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/logging/__init__.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/parallel/__init__.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/tensorboard/__init__.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/audyn/utils/textgrid/__init__.py +0 -0
- {Audyn-0.0.1.dev1 → audyn-0.0.1.dev7}/setup.cfg +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: Audyn
|
|
3
|
-
Version: 0.0.1.dev1
|
|
3
|
+
Version: 0.0.1.dev7
|
|
4
4
|
Summary: A PyTorch toolkit for audio synthesis.
|
|
5
5
|
Author: Takuya Hasumi
|
|
6
6
|
License: Apache License
|
|
@@ -209,6 +209,7 @@ Project-URL: url, https://github.com/tky823/Audyn
|
|
|
209
209
|
Requires-Python: <4,>=3.8
|
|
210
210
|
Description-Content-Type: text/markdown
|
|
211
211
|
License-File: LICENSE
|
|
212
|
+
Requires-Dist: importlib_resources<6.2; python_version == "3.8"
|
|
212
213
|
Requires-Dist: omegaconf
|
|
213
214
|
Requires-Dist: hydra-core
|
|
214
215
|
Requires-Dist: matplotlib
|
|
@@ -217,17 +218,27 @@ Requires-Dist: torchaudio
|
|
|
217
218
|
Requires-Dist: torchtext
|
|
218
219
|
Requires-Dist: torchvision
|
|
219
220
|
Requires-Dist: tensorboard
|
|
221
|
+
Requires-Dist: webdataset
|
|
222
|
+
Requires-Dist: inflect
|
|
220
223
|
Provides-Extra: recipes
|
|
221
224
|
Requires-Dist: tqdm; extra == "recipes"
|
|
222
225
|
Provides-Extra: dev
|
|
223
226
|
Requires-Dist: flake8; extra == "dev"
|
|
224
227
|
Requires-Dist: black; extra == "dev"
|
|
225
228
|
Requires-Dist: isort; extra == "dev"
|
|
229
|
+
Provides-Extra: docs
|
|
230
|
+
Requires-Dist: sphinx; extra == "docs"
|
|
231
|
+
Requires-Dist: sphinx-autodoc-typehints; extra == "docs"
|
|
232
|
+
Requires-Dist: sphinx-autobuild; extra == "docs"
|
|
233
|
+
Requires-Dist: nbsphinx; extra == "docs"
|
|
234
|
+
Requires-Dist: furo; extra == "docs"
|
|
226
235
|
Provides-Extra: tests
|
|
227
236
|
Requires-Dist: pytest; extra == "tests"
|
|
228
237
|
Requires-Dist: pytest-cov; extra == "tests"
|
|
229
238
|
|
|
230
239
|
# Audyn
|
|
240
|
+
[codecov](https://codecov.io/gh/tky823/Audyn)
|
|
241
|
+
|
|
231
242
|
Audyn is a PyTorch toolkit for audio synthesis.
|
|
232
243
|
|
|
233
244
|
## Installation
|
|
@@ -248,12 +259,43 @@ If you need to run recipes, add `[recipes]` as follows:
|
|
|
248
259
|
pip install -e ".[recipes]"
|
|
249
260
|
```
|
|
250
261
|
|
|
262
|
+
If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build the C++-related modules.
|
|
263
|
+
|
|
264
|
+
### C++ extension
|
|
265
|
+
We use a [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search for the monotonic alignment in some models (e.g. GlowTTS).
|
|
266
|
+
To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
|
|
267
|
+
|
|
268
|
+
```shell
|
|
269
|
+
# In Audyn/
|
|
270
|
+
export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
|
|
271
|
+
export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
|
|
272
|
+
pip install -e "."
|
|
273
|
+
```
|
|
274
|
+
|
|
251
275
|
## Development
|
|
252
276
|
```shell
|
|
253
277
|
# In Audyn/
|
|
254
278
|
pip install -e ".[recipes,dev,tests]"
|
|
255
279
|
```
|
|
256
280
|
|
|
281
|
+
## Build Documentation Locally (optional)
|
|
282
|
+
To build the documentation locally, you have to include `docs` when installing `Audyn`.
|
|
283
|
+
```shell
|
|
284
|
+
pip install -e ".[docs]"
|
|
285
|
+
```
|
|
286
|
+
|
|
287
|
+
To build the documentation, run the following commands.
|
|
288
|
+
```shell
|
|
289
|
+
cd docs/
|
|
290
|
+
make html
|
|
291
|
+
```
|
|
292
|
+
|
|
293
|
+
Or, you can build the documentation automatically using `sphinx-autobuild`.
|
|
294
|
+
```shell
|
|
295
|
+
# in Audyn/
|
|
296
|
+
sphinx-autobuild docs docs/_build/html
|
|
297
|
+
```
|
|
298
|
+
|
|
257
299
|
## Test
|
|
258
300
|
```shell
|
|
259
301
|
pytest tests/package
|
|
@@ -0,0 +1,193 @@
|
|
|
1
|
+
LICENSE
|
|
2
|
+
MANIFEST.in
|
|
3
|
+
README.md
|
|
4
|
+
pyproject.toml
|
|
5
|
+
setup.py
|
|
6
|
+
Audyn.egg-info/PKG-INFO
|
|
7
|
+
Audyn.egg-info/SOURCES.txt
|
|
8
|
+
Audyn.egg-info/dependency_links.txt
|
|
9
|
+
Audyn.egg-info/requires.txt
|
|
10
|
+
Audyn.egg-info/top_level.txt
|
|
11
|
+
audyn/__init__.py
|
|
12
|
+
audyn/criterion/__init__.py
|
|
13
|
+
audyn/criterion/autoregressive.py
|
|
14
|
+
audyn/criterion/base.py
|
|
15
|
+
audyn/criterion/contrastive.py
|
|
16
|
+
audyn/criterion/distance.py
|
|
17
|
+
audyn/criterion/fastspeech.py
|
|
18
|
+
audyn/criterion/flow.py
|
|
19
|
+
audyn/criterion/gan.py
|
|
20
|
+
audyn/criterion/glowtts.py
|
|
21
|
+
audyn/criterion/hifigan.py
|
|
22
|
+
audyn/criterion/lsgan.py
|
|
23
|
+
audyn/criterion/melspectrogram.py
|
|
24
|
+
audyn/criterion/rvqvae.py
|
|
25
|
+
audyn/criterion/ssast.py
|
|
26
|
+
audyn/criterion/vqvae.py
|
|
27
|
+
audyn/functional/__init__.py
|
|
28
|
+
audyn/functional/activation.py
|
|
29
|
+
audyn/functional/clustering.py
|
|
30
|
+
audyn/functional/vector_quantization.py
|
|
31
|
+
audyn/metrics/__init__.py
|
|
32
|
+
audyn/metrics/base.py
|
|
33
|
+
audyn/metrics/crossmodal.py
|
|
34
|
+
audyn/metrics/retrieval.py
|
|
35
|
+
audyn/models/__init__.py
|
|
36
|
+
audyn/models/ast.py
|
|
37
|
+
audyn/models/encodec.py
|
|
38
|
+
audyn/models/fastspeech.py
|
|
39
|
+
audyn/models/gan.py
|
|
40
|
+
audyn/models/glowtts.py
|
|
41
|
+
audyn/models/hifigan.py
|
|
42
|
+
audyn/models/lextransformer.py
|
|
43
|
+
audyn/models/passt.py
|
|
44
|
+
audyn/models/pixelsnail.py
|
|
45
|
+
audyn/models/roformer.py
|
|
46
|
+
audyn/models/rvqvae.py
|
|
47
|
+
audyn/models/soundstream.py
|
|
48
|
+
audyn/models/ssast.py
|
|
49
|
+
audyn/models/text_to_wave.py
|
|
50
|
+
audyn/models/vae.py
|
|
51
|
+
audyn/models/vqvae.py
|
|
52
|
+
audyn/models/waveglow.py
|
|
53
|
+
audyn/models/wavenet.py
|
|
54
|
+
audyn/modules/activation.py
|
|
55
|
+
audyn/modules/duration_predictor.py
|
|
56
|
+
audyn/modules/encodec.py
|
|
57
|
+
audyn/modules/fastspeech.py
|
|
58
|
+
audyn/modules/film.py
|
|
59
|
+
audyn/modules/flow.py
|
|
60
|
+
audyn/modules/glow.py
|
|
61
|
+
audyn/modules/glowtts.py
|
|
62
|
+
audyn/modules/normalization.py
|
|
63
|
+
audyn/modules/passt.py
|
|
64
|
+
audyn/modules/pixelcnn.py
|
|
65
|
+
audyn/modules/pixelsnail.py
|
|
66
|
+
audyn/modules/positional_encoding.py
|
|
67
|
+
audyn/modules/rvq.py
|
|
68
|
+
audyn/modules/soundstream.py
|
|
69
|
+
audyn/modules/vit.py
|
|
70
|
+
audyn/modules/vq.py
|
|
71
|
+
audyn/modules/vqvae.py
|
|
72
|
+
audyn/modules/waveglow.py
|
|
73
|
+
audyn/modules/wavenet.py
|
|
74
|
+
audyn/optim/lr_scheduler.py
|
|
75
|
+
audyn/optim/optimizer.py
|
|
76
|
+
audyn/transforms/__init__.py
|
|
77
|
+
audyn/transforms/ast.py
|
|
78
|
+
audyn/transforms/birdclef.py
|
|
79
|
+
audyn/transforms/cqt.py
|
|
80
|
+
audyn/transforms/hifigan.py
|
|
81
|
+
audyn/transforms/hubert.py
|
|
82
|
+
audyn/transforms/kaldi.py
|
|
83
|
+
audyn/transforms/librosa.py
|
|
84
|
+
audyn/utils/__init__.py
|
|
85
|
+
audyn/utils/clip_grad.py
|
|
86
|
+
audyn/utils/alignment/__init__.py
|
|
87
|
+
audyn/utils/alignment/monotonic_align.py
|
|
88
|
+
audyn/utils/data/__init__.py
|
|
89
|
+
audyn/utils/data/collator.py
|
|
90
|
+
audyn/utils/data/composer.py
|
|
91
|
+
audyn/utils/data/dataloader.py
|
|
92
|
+
audyn/utils/data/dataset.py
|
|
93
|
+
audyn/utils/data/distributed.py
|
|
94
|
+
audyn/utils/data/postprocess.py
|
|
95
|
+
audyn/utils/data/sampler.py
|
|
96
|
+
audyn/utils/data/webdataset.py
|
|
97
|
+
audyn/utils/data/audioset/__init__.py
|
|
98
|
+
audyn/utils/data/audioset/_download.py
|
|
99
|
+
audyn/utils/data/audioset/ast.py
|
|
100
|
+
audyn/utils/data/audioset/composer.py
|
|
101
|
+
audyn/utils/data/audioset/dataset.py
|
|
102
|
+
audyn/utils/data/audioset/distributed.py
|
|
103
|
+
audyn/utils/data/audioset/sampler.py
|
|
104
|
+
audyn/utils/data/birdclef/_common/__init__.py
|
|
105
|
+
audyn/utils/data/birdclef/birdclef2022/__init__.py
|
|
106
|
+
audyn/utils/data/birdclef/birdclef2022/_download.py
|
|
107
|
+
audyn/utils/data/birdclef/birdclef2024/__init__.py
|
|
108
|
+
audyn/utils/data/birdclef/birdclef2024/_download.py
|
|
109
|
+
audyn/utils/data/birdclef/birdclef2024/collator.py
|
|
110
|
+
audyn/utils/data/birdclef/birdclef2024/composer.py
|
|
111
|
+
audyn/utils/data/birdclef/birdclef2024/dataset.py
|
|
112
|
+
audyn/utils/data/birdclef/birdclef2024/models/baseline.py
|
|
113
|
+
audyn/utils/data/clotho/__init__.py
|
|
114
|
+
audyn/utils/data/clotho/text/indexing.py
|
|
115
|
+
audyn/utils/data/clotho/text/normalization.py
|
|
116
|
+
audyn/utils/data/clotho/text/symbols.py
|
|
117
|
+
audyn/utils/data/clotho/text/tokenization.py
|
|
118
|
+
audyn/utils/data/cmudict/__init__.py
|
|
119
|
+
audyn/utils/data/cmudict/indexing.py
|
|
120
|
+
audyn/utils/data/tacotron/__init__.py
|
|
121
|
+
audyn/utils/data/tacotron/text/indexing.py
|
|
122
|
+
audyn/utils/data/tacotron/text/normalization.py
|
|
123
|
+
audyn/utils/data/tacotron/text/numbers.py
|
|
124
|
+
audyn/utils/data/tacotron/text/symbols.py
|
|
125
|
+
audyn/utils/data/tacotron/text/tokenization.py
|
|
126
|
+
audyn/utils/distributed/__init__.py
|
|
127
|
+
audyn/utils/driver/__init__.py
|
|
128
|
+
audyn/utils/driver/_decorator.py
|
|
129
|
+
audyn/utils/driver/base.py
|
|
130
|
+
audyn/utils/driver/feat_to_wave.py
|
|
131
|
+
audyn/utils/driver/gan.py
|
|
132
|
+
audyn/utils/driver/text_to_feat.py
|
|
133
|
+
audyn/utils/driver/text_to_wave.py
|
|
134
|
+
audyn/utils/driver/_conf_template/config.yaml
|
|
135
|
+
audyn/utils/driver/_conf_template/criterion/cross_entropy.yaml
|
|
136
|
+
audyn/utils/driver/_conf_template/criterion/vqvae.yaml
|
|
137
|
+
audyn/utils/driver/_conf_template/data/defaults.yaml
|
|
138
|
+
audyn/utils/driver/_conf_template/lr_scheduler/defaults.yaml
|
|
139
|
+
audyn/utils/driver/_conf_template/lr_scheduler/none.yaml
|
|
140
|
+
audyn/utils/driver/_conf_template/lr_scheduler/transformer.yaml
|
|
141
|
+
audyn/utils/driver/_conf_template/model/defaults.yaml
|
|
142
|
+
audyn/utils/driver/_conf_template/model/gan.yaml
|
|
143
|
+
audyn/utils/driver/_conf_template/optimizer/adam.yaml
|
|
144
|
+
audyn/utils/driver/_conf_template/optimizer/adam_ema.yaml
|
|
145
|
+
audyn/utils/driver/_conf_template/optimizer/adamw.yaml
|
|
146
|
+
audyn/utils/driver/_conf_template/optimizer/gan.yaml
|
|
147
|
+
audyn/utils/driver/_conf_template/preprocess/defaults.yaml
|
|
148
|
+
audyn/utils/driver/_conf_template/preprocess/ljspeech_text-to-feat.yaml
|
|
149
|
+
audyn/utils/driver/_conf_template/preprocess/text-to-feat.yaml
|
|
150
|
+
audyn/utils/driver/_conf_template/preprocess/text-to-wave.yaml
|
|
151
|
+
audyn/utils/driver/_conf_template/system/cpu.yaml
|
|
152
|
+
audyn/utils/driver/_conf_template/system/cuda.yaml
|
|
153
|
+
audyn/utils/driver/_conf_template/system/cuda_amp.yaml
|
|
154
|
+
audyn/utils/driver/_conf_template/system/cuda_ddp.yaml
|
|
155
|
+
audyn/utils/driver/_conf_template/system/cuda_ddp_amp.yaml
|
|
156
|
+
audyn/utils/driver/_conf_template/system/defaults.yaml
|
|
157
|
+
audyn/utils/driver/_conf_template/system/mps.yaml
|
|
158
|
+
audyn/utils/driver/_conf_template/test/defaults.yaml
|
|
159
|
+
audyn/utils/driver/_conf_template/test/text_to_wave.yaml
|
|
160
|
+
audyn/utils/driver/_conf_template/test/dataloader/defaults.yaml
|
|
161
|
+
audyn/utils/driver/_conf_template/test/dataset/defaults.yaml
|
|
162
|
+
audyn/utils/driver/_conf_template/test/dataset/torch.yaml
|
|
163
|
+
audyn/utils/driver/_conf_template/train/defaults.yaml
|
|
164
|
+
audyn/utils/driver/_conf_template/train/gan.yaml
|
|
165
|
+
audyn/utils/driver/_conf_template/train/template.yaml
|
|
166
|
+
audyn/utils/driver/_conf_template/train/text-to-feat+pretrained_feat-to-wave.yaml
|
|
167
|
+
audyn/utils/driver/_conf_template/train/clip_gradient/defaults.yaml
|
|
168
|
+
audyn/utils/driver/_conf_template/train/clip_gradient/gan.yaml
|
|
169
|
+
audyn/utils/driver/_conf_template/train/dataloader/defaults.yaml
|
|
170
|
+
audyn/utils/driver/_conf_template/train/dataloader/sequential-batch.yaml
|
|
171
|
+
audyn/utils/driver/_conf_template/train/dataset/defaults.yaml
|
|
172
|
+
audyn/utils/driver/_conf_template/train/dataset/sortable-torch.yaml
|
|
173
|
+
audyn/utils/driver/_conf_template/train/dataset/torch.yaml
|
|
174
|
+
audyn/utils/driver/_conf_template/train/dataset/webdataset.yaml
|
|
175
|
+
audyn/utils/driver/_conf_template/train/record/defaults.yaml
|
|
176
|
+
audyn/utils/driver/_conf_template/train/record/template.yaml
|
|
177
|
+
audyn/utils/duration/__init__.py
|
|
178
|
+
audyn/utils/github/__init__.py
|
|
179
|
+
audyn/utils/hydra/__init__.py
|
|
180
|
+
audyn/utils/hydra/utils.py
|
|
181
|
+
audyn/utils/lab/__init__.py
|
|
182
|
+
audyn/utils/logging/__init__.py
|
|
183
|
+
audyn/utils/model/__init__.py
|
|
184
|
+
audyn/utils/music/__init__.py
|
|
185
|
+
audyn/utils/parallel/__init__.py
|
|
186
|
+
audyn/utils/tensorboard/__init__.py
|
|
187
|
+
audyn/utils/text/__init__.py
|
|
188
|
+
audyn/utils/text/indexing.py
|
|
189
|
+
audyn/utils/text/normalization.py
|
|
190
|
+
audyn/utils/text/pronunciation.py
|
|
191
|
+
audyn/utils/text/tokenization.py
|
|
192
|
+
audyn/utils/textgrid/__init__.py
|
|
193
|
+
cpp_extensions/monotonic_align/monotonic_align.cpp
|
|
@@ -6,12 +6,24 @@ torchaudio
|
|
|
6
6
|
torchtext
|
|
7
7
|
torchvision
|
|
8
8
|
tensorboard
|
|
9
|
+
webdataset
|
|
10
|
+
inflect
|
|
11
|
+
|
|
12
|
+
[:python_version == "3.8"]
|
|
13
|
+
importlib_resources<6.2
|
|
9
14
|
|
|
10
15
|
[dev]
|
|
11
16
|
flake8
|
|
12
17
|
black
|
|
13
18
|
isort
|
|
14
19
|
|
|
20
|
+
[docs]
|
|
21
|
+
sphinx
|
|
22
|
+
sphinx-autodoc-typehints
|
|
23
|
+
sphinx-autobuild
|
|
24
|
+
nbsphinx
|
|
25
|
+
furo
|
|
26
|
+
|
|
15
27
|
[recipes]
|
|
16
28
|
tqdm
|
|
17
29
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: Audyn
|
|
3
|
-
Version: 0.0.1.dev1
|
|
3
|
+
Version: 0.0.1.dev7
|
|
4
4
|
Summary: A PyTorch toolkit for audio synthesis.
|
|
5
5
|
Author: Takuya Hasumi
|
|
6
6
|
License: Apache License
|
|
@@ -209,6 +209,7 @@ Project-URL: url, https://github.com/tky823/Audyn
|
|
|
209
209
|
Requires-Python: <4,>=3.8
|
|
210
210
|
Description-Content-Type: text/markdown
|
|
211
211
|
License-File: LICENSE
|
|
212
|
+
Requires-Dist: importlib_resources<6.2; python_version == "3.8"
|
|
212
213
|
Requires-Dist: omegaconf
|
|
213
214
|
Requires-Dist: hydra-core
|
|
214
215
|
Requires-Dist: matplotlib
|
|
@@ -217,17 +218,27 @@ Requires-Dist: torchaudio
|
|
|
217
218
|
Requires-Dist: torchtext
|
|
218
219
|
Requires-Dist: torchvision
|
|
219
220
|
Requires-Dist: tensorboard
|
|
221
|
+
Requires-Dist: webdataset
|
|
222
|
+
Requires-Dist: inflect
|
|
220
223
|
Provides-Extra: recipes
|
|
221
224
|
Requires-Dist: tqdm; extra == "recipes"
|
|
222
225
|
Provides-Extra: dev
|
|
223
226
|
Requires-Dist: flake8; extra == "dev"
|
|
224
227
|
Requires-Dist: black; extra == "dev"
|
|
225
228
|
Requires-Dist: isort; extra == "dev"
|
|
229
|
+
Provides-Extra: docs
|
|
230
|
+
Requires-Dist: sphinx; extra == "docs"
|
|
231
|
+
Requires-Dist: sphinx-autodoc-typehints; extra == "docs"
|
|
232
|
+
Requires-Dist: sphinx-autobuild; extra == "docs"
|
|
233
|
+
Requires-Dist: nbsphinx; extra == "docs"
|
|
234
|
+
Requires-Dist: furo; extra == "docs"
|
|
226
235
|
Provides-Extra: tests
|
|
227
236
|
Requires-Dist: pytest; extra == "tests"
|
|
228
237
|
Requires-Dist: pytest-cov; extra == "tests"
|
|
229
238
|
|
|
230
239
|
# Audyn
|
|
240
|
+
[codecov](https://codecov.io/gh/tky823/Audyn)
|
|
241
|
+
|
|
231
242
|
Audyn is a PyTorch toolkit for audio synthesis.
|
|
232
243
|
|
|
233
244
|
## Installation
|
|
@@ -248,12 +259,43 @@ If you need to run recipes, add `[recipes]` as follows:
|
|
|
248
259
|
pip install -e ".[recipes]"
|
|
249
260
|
```
|
|
250
261
|
|
|
262
|
+
If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build the C++-related modules.
|
|
263
|
+
|
|
264
|
+
### C++ extension
|
|
265
|
+
We use a [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search for the monotonic alignment in some models (e.g. GlowTTS).
|
|
266
|
+
To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
|
|
267
|
+
|
|
268
|
+
```shell
|
|
269
|
+
# In Audyn/
|
|
270
|
+
export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
|
|
271
|
+
export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
|
|
272
|
+
pip install -e "."
|
|
273
|
+
```
|
|
274
|
+
|
|
251
275
|
## Development
|
|
252
276
|
```shell
|
|
253
277
|
# In Audyn/
|
|
254
278
|
pip install -e ".[recipes,dev,tests]"
|
|
255
279
|
```
|
|
256
280
|
|
|
281
|
+
## Build Documentation Locally (optional)
|
|
282
|
+
To build the documentation locally, you have to include `docs` when installing `Audyn`.
|
|
283
|
+
```shell
|
|
284
|
+
pip install -e ".[docs]"
|
|
285
|
+
```
|
|
286
|
+
|
|
287
|
+
To build the documentation, run the following commands.
|
|
288
|
+
```shell
|
|
289
|
+
cd docs/
|
|
290
|
+
make html
|
|
291
|
+
```
|
|
292
|
+
|
|
293
|
+
Or, you can build the documentation automatically using `sphinx-autobuild`.
|
|
294
|
+
```shell
|
|
295
|
+
# in Audyn/
|
|
296
|
+
sphinx-autobuild docs docs/_build/html
|
|
297
|
+
```
|
|
298
|
+
|
|
257
299
|
## Test
|
|
258
300
|
```shell
|
|
259
301
|
pytest tests/package
|
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
# Audyn
|
|
2
|
+
[codecov](https://codecov.io/gh/tky823/Audyn)
|
|
3
|
+
|
|
4
|
+
Audyn is a PyTorch toolkit for audio synthesis.
|
|
5
|
+
|
|
6
|
+
## Installation
|
|
7
|
+
You can install by pip.
|
|
8
|
+
```shell
|
|
9
|
+
pip install git+https://github.com/tky823/Audyn.git
|
|
10
|
+
```
|
|
11
|
+
or clone this repository.
|
|
12
|
+
```shell
|
|
13
|
+
git clone https://github.com/tky823/Audyn.git
|
|
14
|
+
cd Audyn
|
|
15
|
+
pip install -e .
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
If you need to run recipes, add `[recipes]` as follows:
|
|
19
|
+
```shell
|
|
20
|
+
# In Audyn/
|
|
21
|
+
pip install -e ".[recipes]"
|
|
22
|
+
```
|
|
23
|
+
|
|
24
|
+
If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build C++-related modules.
|
|
25
|
+
|
|
26
|
+
### C++ extension
|
|
27
|
+
We use a [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search for monotonic alignments in some models (e.g. GlowTTS).
|
|
28
|
+
To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
|
|
29
|
+
|
|
30
|
+
```shell
|
|
31
|
+
# In Audyn/
|
|
32
|
+
export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
|
|
33
|
+
export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
|
|
34
|
+
pip install -e "."
|
|
35
|
+
```
|
|
36
|
+
|
|
37
|
+
## Development
|
|
38
|
+
```shell
|
|
39
|
+
# In Audyn/
|
|
40
|
+
pip install -e ".[recipes,dev,tests]"
|
|
41
|
+
```
|
|
42
|
+
|
|
43
|
+
## Build Documentation Locally (optional)
|
|
44
|
+
To build the documentation locally, you have to include `docs` when installing `Audyn`.
|
|
45
|
+
```shell
|
|
46
|
+
pip install -e ".[docs]"
|
|
47
|
+
```
|
|
48
|
+
|
|
49
|
+
When you build the documentation, run the following command.
|
|
50
|
+
```shell
|
|
51
|
+
cd docs/
|
|
52
|
+
make html
|
|
53
|
+
```
|
|
54
|
+
|
|
55
|
+
Or, you can build the documentation automatically using `sphinx-autobuild`.
|
|
56
|
+
```shell
|
|
57
|
+
# in Audyn/
|
|
58
|
+
sphinx-autobuild docs docs/_build/html
|
|
59
|
+
```
|
|
60
|
+
|
|
61
|
+
## Test
|
|
62
|
+
```shell
|
|
63
|
+
pytest tests/package
|
|
64
|
+
```
|
|
@@ -0,0 +1,61 @@
|
|
|
1
|
+
import importlib
|
|
2
|
+
import operator
|
|
3
|
+
import re
|
|
4
|
+
from typing import Any
|
|
5
|
+
|
|
6
|
+
from omegaconf import OmegaConf
|
|
7
|
+
|
|
8
|
+
from .utils.hydra import main
|
|
9
|
+
|
|
10
|
+
__all__ = ["__version__", "main"]
|
|
11
|
+
|
|
12
|
+
__version__ = "0.0.1.dev7"
|
|
13
|
+
|
|
14
|
+
# for resolver
|
|
15
|
+
_whitespace_re = re.compile(r"\s+")
|
|
16
|
+
_int_re = re.compile(r"^\d+$")
|
|
17
|
+
_float_re = re.compile(r"^[0-9]*\.?[0-9]+([eE][-+]?[0-9]+)?$")
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
def _constant_resolver(full_var_name: str) -> Any:
    """Resolve the argument of the ``const`` resolver to a Python object.

    The argument is either a single dotted path, or a dotted path followed by
    one or more ``+``-separated numeric literals that are added to the
    resolved object, e.g. ``audyn.utils.data.clotho.vocab_size + 1``.

    Args:
        full_var_name (str): Expression given to the resolver.

    Returns:
        any: Resolved object, with every numeric literal added to it.

    Raises:
        ValueError: If a term after ``+`` is neither an integer nor a float literal.

    """
    if "+" not in full_var_name:
        return _resolve(full_var_name)

    # TODO: generalize
    # Only the first term is a dotted path; every following term has to be a
    # numeric literal (whitespace around it is allowed).
    head, *addends = full_var_name.split("+")
    total = _resolve(head)

    for raw_term in addends:
        term = _whitespace_re.sub("", raw_term)

        if _int_re.match(term):
            number = int(term)
        elif _float_re.match(term):
            number = float(term)
        else:
            raise ValueError(f"{term} cannot be converted to int nor float.")

        total = operator.add(total, number)

    return total
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
def _resolve(full_var_name: str) -> Any:
    """Import and return the object named by a dotted path.

    The path is split at its last ``.`` into a module name and an attribute
    name. If that module cannot be imported, the path is re-interpreted as
    ``module.owner.attribute``: ``owner`` is looked up in ``module`` and
    ``attribute`` is looked up on ``owner``.

    Args:
        full_var_name (str): Dotted path such as ``package.module.CONSTANT`` or
            ``package.module.ClassName.attribute``. Surrounding whitespace is ignored.

    Returns:
        any: Object found at the given path.

    Raises:
        ValueError: If the path cannot be split into a module part and an
            attribute part, either directly or in the fallback lookup.

    """
    full_var_name = full_var_name.strip()
    mod_name, sep, var_name = full_var_name.rpartition(".")

    if not sep:
        # Without this check the failure would surface as an opaque
        # tuple-unpacking error.
        raise ValueError(
            f"{full_var_name} is not a dotted path of the form 'module.attribute'."
        )

    try:
        resolved = getattr(importlib.import_module(mod_name), var_name)
    except ModuleNotFoundError as e:
        # TODO: generalize
        # The second-to-last component may name an object inside a module
        # rather than a module itself, so retry one level up.
        attr_name = var_name
        mod_name, sep, var_name = mod_name.rpartition(".")

        if not sep:
            raise ValueError(
                f"{full_var_name} cannot be resolved because its module cannot be imported."
            ) from e

        imported_module = importlib.import_module(mod_name)
        owner = getattr(imported_module, var_name)
        resolved = getattr(owner, attr_name)

    return resolved
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
OmegaConf.register_new_resolver("const", _constant_resolver)
|
|
@@ -30,13 +30,13 @@ class MultiCriteria(nn.ModuleDict):
|
|
|
30
30
|
|
|
31
31
|
Examples:
|
|
32
32
|
|
|
33
|
-
>>> import
|
|
33
|
+
>>> import audyn
|
|
34
34
|
>>> import torch
|
|
35
35
|
>>> torch.manual_seed(0)
|
|
36
36
|
>>> config = {
|
|
37
|
-
... "_target_": "audyn.criterion.
|
|
37
|
+
... "_target_": "audyn.criterion.MultiCriteria",
|
|
38
38
|
... "mse": {
|
|
39
|
-
... "_target_": "audyn.criterion.
|
|
39
|
+
... "_target_": "audyn.criterion.BaseCriterionWrapper",
|
|
40
40
|
... "criterion": {
|
|
41
41
|
... "_target_": "torch.nn.MSELoss",
|
|
42
42
|
... "reduction": "mean",
|
|
@@ -52,7 +52,7 @@ class MultiCriteria(nn.ModuleDict):
|
|
|
52
52
|
... }
|
|
53
53
|
... },
|
|
54
54
|
... "mae": {
|
|
55
|
-
... "_target_": "audyn.criterion.
|
|
55
|
+
... "_target_": "audyn.criterion.BaseCriterionWrapper",
|
|
56
56
|
... "criterion": {
|
|
57
57
|
... "_target_": "torch.nn.L1Loss",
|
|
58
58
|
... "reduction": "mean",
|
|
@@ -68,7 +68,7 @@ class MultiCriteria(nn.ModuleDict):
|
|
|
68
68
|
... }
|
|
69
69
|
... }
|
|
70
70
|
... }
|
|
71
|
-
>>> criterion =
|
|
71
|
+
>>> criterion = audyn.utils.instantiate_criterion(config)
|
|
72
72
|
>>> y = torch.randn((4,))
|
|
73
73
|
>>> t_mse = torch.randn_like(y)
|
|
74
74
|
>>> t_mae = torch.randn_like(y)
|