Audyn 0.0.1.dev1__tar.gz → 0.0.1.dev6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (212)
  1. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/Audyn.egg-info/PKG-INFO +43 -1
  2. audyn-0.0.1.dev6/Audyn.egg-info/SOURCES.txt +190 -0
  3. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/Audyn.egg-info/requires.txt +12 -0
  4. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/MANIFEST.in +2 -1
  5. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/PKG-INFO +43 -1
  6. audyn-0.0.1.dev6/README.md +64 -0
  7. audyn-0.0.1.dev6/audyn/__init__.py +61 -0
  8. audyn-0.0.1.dev6/audyn/criterion/__init__.py +6 -0
  9. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/base.py +5 -5
  10. audyn-0.0.1.dev6/audyn/criterion/contrastive.py +698 -0
  11. audyn-0.0.1.dev6/audyn/criterion/distance.py +123 -0
  12. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/flow.py +37 -4
  13. audyn-0.0.1.dev6/audyn/criterion/gan.py +49 -0
  14. audyn-0.0.1.dev6/audyn/criterion/glowtts.py +96 -0
  15. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/hifigan.py +20 -1
  16. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/melspectrogram.py +13 -1
  17. audyn-0.0.1.dev6/audyn/criterion/rvqvae.py +91 -0
  18. audyn-0.0.1.dev6/audyn/criterion/ssast.py +108 -0
  19. audyn-0.0.1.dev6/audyn/criterion/vqvae.py +95 -0
  20. audyn-0.0.1.dev6/audyn/functional/__init__.py +3 -0
  21. audyn-0.0.1.dev6/audyn/functional/activation.py +119 -0
  22. audyn-0.0.1.dev6/audyn/functional/clustering.py +237 -0
  23. audyn-0.0.1.dev6/audyn/functional/vector_quantization.py +97 -0
  24. audyn-0.0.1.dev6/audyn/metrics/__init__.py +62 -0
  25. audyn-0.0.1.dev6/audyn/metrics/base.py +98 -0
  26. audyn-0.0.1.dev6/audyn/metrics/crossmodal.py +191 -0
  27. audyn-0.0.1.dev6/audyn/metrics/retrieval.py +182 -0
  28. audyn-0.0.1.dev6/audyn/models/__init__.py +53 -0
  29. audyn-0.0.1.dev6/audyn/models/ast.py +686 -0
  30. audyn-0.0.1.dev6/audyn/models/encodec.py +470 -0
  31. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/fastspeech.py +236 -88
  32. audyn-0.0.1.dev6/audyn/models/glowtts.py +1111 -0
  33. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/hifigan.py +10 -0
  34. audyn-0.0.1.dev6/audyn/models/lextransformer.py +449 -0
  35. audyn-0.0.1.dev6/audyn/models/passt.py +237 -0
  36. audyn-0.0.1.dev6/audyn/models/pixelsnail.py +203 -0
  37. audyn-0.0.1.dev6/audyn/models/roformer.py +468 -0
  38. audyn-0.0.1.dev6/audyn/models/rvqvae.py +235 -0
  39. audyn-0.0.1.dev6/audyn/models/soundstream.py +737 -0
  40. audyn-0.0.1.dev6/audyn/models/ssast.py +1008 -0
  41. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/text_to_wave.py +57 -50
  42. audyn-0.0.1.dev6/audyn/models/vae.py +24 -0
  43. audyn-0.0.1.dev6/audyn/models/vqvae.py +183 -0
  44. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/waveglow.py +63 -52
  45. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/wavenet.py +63 -36
  46. audyn-0.0.1.dev6/audyn/modules/activation.py +1166 -0
  47. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/duration_predictor.py +40 -10
  48. audyn-0.0.1.dev6/audyn/modules/encodec.py +329 -0
  49. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/fastspeech.py +4 -12
  50. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/flow.py +4 -6
  51. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/glow.py +133 -27
  52. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/glowtts.py +363 -47
  53. audyn-0.0.1.dev6/audyn/modules/passt.py +574 -0
  54. audyn-0.0.1.dev6/audyn/modules/pixelcnn.py +319 -0
  55. audyn-0.0.1.dev6/audyn/modules/pixelsnail.py +545 -0
  56. audyn-0.0.1.dev6/audyn/modules/positional_encoding.py +219 -0
  57. audyn-0.0.1.dev6/audyn/modules/rvq.py +156 -0
  58. audyn-0.0.1.dev6/audyn/modules/soundstream.py +307 -0
  59. audyn-0.0.1.dev6/audyn/modules/vit.py +468 -0
  60. audyn-0.0.1.dev6/audyn/modules/vq.py +245 -0
  61. audyn-0.0.1.dev6/audyn/modules/vqvae.py +5 -0
  62. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/waveglow.py +28 -28
  63. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/wavenet.py +34 -34
  64. audyn-0.0.1.dev6/audyn/optim/lr_scheduler.py +182 -0
  65. audyn-0.0.1.dev6/audyn/optim/optimizer.py +1447 -0
  66. audyn-0.0.1.dev6/audyn/transforms/__init__.py +23 -0
  67. audyn-0.0.1.dev6/audyn/transforms/ast.py +185 -0
  68. audyn-0.0.1.dev6/audyn/transforms/birdclef.py +168 -0
  69. audyn-0.0.1.dev6/audyn/transforms/cqt.py +705 -0
  70. audyn-0.0.1.dev6/audyn/transforms/hifigan.py +95 -0
  71. audyn-0.0.1.dev6/audyn/transforms/hubert.py +59 -0
  72. audyn-0.0.1.dev6/audyn/transforms/kaldi.py +461 -0
  73. audyn-0.0.1.dev6/audyn/transforms/librosa.py +83 -0
  74. audyn-0.0.1.dev6/audyn/utils/__init__.py +628 -0
  75. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/alignment/__init__.py +10 -3
  76. audyn-0.0.1.dev6/audyn/utils/alignment/monotonic_align.py +66 -0
  77. audyn-0.0.1.dev6/audyn/utils/clip_grad.py +171 -0
  78. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/data/__init__.py +12 -51
  79. audyn-0.0.1.dev6/audyn/utils/data/audioset/__init__.py +9 -0
  80. audyn-0.0.1.dev6/audyn/utils/data/audioset/_download.py +53 -0
  81. audyn-0.0.1.dev6/audyn/utils/data/audioset/ast.py +7 -0
  82. audyn-0.0.1.dev6/audyn/utils/data/audioset/composer.py +190 -0
  83. audyn-0.0.1.dev6/audyn/utils/data/audioset/dataset.py +516 -0
  84. audyn-0.0.1.dev6/audyn/utils/data/audioset/distributed.py +105 -0
  85. audyn-0.0.1.dev6/audyn/utils/data/audioset/sampler.py +102 -0
  86. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/__init__.py +196 -0
  87. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/_download.py +32 -0
  88. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/collator.py +54 -0
  89. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/composer.py +290 -0
  90. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/dataset.py +217 -0
  91. audyn-0.0.1.dev6/audyn/utils/data/birdclef/birdclef2024/models/baseline.py +65 -0
  92. audyn-0.0.1.dev6/audyn/utils/data/clotho/__init__.py +37 -0
  93. audyn-0.0.1.dev6/audyn/utils/data/clotho/text/indexing.py +113 -0
  94. audyn-0.0.1.dev6/audyn/utils/data/clotho/text/normalization.py +27 -0
  95. audyn-0.0.1.dev6/audyn/utils/data/clotho/text/symbols.py +9 -0
  96. audyn-0.0.1.dev6/audyn/utils/data/clotho/text/tokenization.py +25 -0
  97. audyn-0.0.1.dev6/audyn/utils/data/cmudict/__init__.py +223 -0
  98. audyn-0.0.1.dev6/audyn/utils/data/cmudict/indexing.py +39 -0
  99. audyn-0.0.1.dev6/audyn/utils/data/collator.py +126 -0
  100. audyn-0.0.1.dev6/audyn/utils/data/composer.py +110 -0
  101. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/data/dataloader.py +72 -40
  102. audyn-0.0.1.dev6/audyn/utils/data/dataset.py +196 -0
  103. audyn-0.0.1.dev6/audyn/utils/data/postprocess.py +320 -0
  104. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/data/sampler.py +4 -1
  105. audyn-0.0.1.dev6/audyn/utils/data/tacotron/__init__.py +30 -0
  106. audyn-0.0.1.dev6/audyn/utils/data/tacotron/text/indexing.py +33 -0
  107. audyn-0.0.1.dev6/audyn/utils/data/tacotron/text/normalization.py +118 -0
  108. audyn-0.0.1.dev6/audyn/utils/data/tacotron/text/numbers.py +83 -0
  109. audyn-0.0.1.dev6/audyn/utils/data/tacotron/text/symbols.py +90 -0
  110. audyn-0.0.1.dev6/audyn/utils/data/tacotron/text/tokenization.py +26 -0
  111. audyn-0.0.1.dev6/audyn/utils/data/webdataset.py +72 -0
  112. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/distributed/__init__.py +8 -1
  113. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/driver/__init__.py +4 -2
  114. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/config.yaml +15 -0
  115. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/criterion/cross_entropy.yaml +15 -0
  116. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/criterion/vqvae.yaml +34 -0
  117. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/data/defaults.yaml +2 -0
  118. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/lr_scheduler/defaults.yaml +0 -0
  119. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/lr_scheduler/none.yaml +0 -0
  120. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/lr_scheduler/transformer.yaml +3 -0
  121. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/model/defaults.yaml +0 -0
  122. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/model/gan.yaml +2 -0
  123. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/optimizer/adam.yaml +1 -0
  124. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/optimizer/adam_ema.yaml +5 -0
  125. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/optimizer/adamw.yaml +1 -0
  126. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/optimizer/gan.yaml +2 -0
  127. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/preprocess/defaults.yaml +6 -0
  128. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/preprocess/ljspeech_text-to-feat.yaml +6 -0
  129. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/preprocess/text-to-feat.yaml +5 -0
  130. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/preprocess/text-to-wave.yaml +5 -0
  131. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/cpu.yaml +11 -0
  132. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/cuda.yaml +11 -0
  133. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/cuda_amp.yaml +11 -0
  134. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/cuda_ddp.yaml +11 -0
  135. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/cuda_ddp_amp.yaml +11 -0
  136. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/defaults.yaml +11 -0
  137. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/system/mps.yaml +11 -0
  138. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/test/dataloader/defaults.yaml +4 -0
  139. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/test/dataset/defaults.yaml +3 -0
  140. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/test/dataset/torch.yaml +4 -0
  141. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/test/defaults.yaml +28 -0
  142. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/test/text_to_wave.yaml +36 -0
  143. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/clip_gradient/defaults.yaml +0 -0
  144. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/clip_gradient/gan.yaml +6 -0
  145. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataloader/defaults.yaml +8 -0
  146. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataloader/sequential-batch.yaml +9 -0
  147. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataset/defaults.yaml +6 -0
  148. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataset/sortable-torch.yaml +9 -0
  149. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataset/torch.yaml +8 -0
  150. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/dataset/webdataset.yaml +8 -0
  151. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/defaults.yaml +35 -0
  152. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/gan.yaml +51 -0
  153. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/record/defaults.yaml +0 -0
  154. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/record/template.yaml +58 -0
  155. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/template.yaml +45 -0
  156. audyn-0.0.1.dev6/audyn/utils/driver/_conf_template/train/text-to-feat+pretrained_feat-to-wave.yaml +51 -0
  157. audyn-0.0.1.dev6/audyn/utils/driver/base.py +2585 -0
  158. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/driver/feat_to_wave.py +4 -1
  159. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/driver/gan.py +357 -339
  160. audyn-0.0.1.dev6/audyn/utils/driver/text_to_feat.py +461 -0
  161. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/driver/text_to_wave.py +34 -9
  162. audyn-0.0.1.dev6/audyn/utils/duration/__init__.py +44 -0
  163. audyn-0.0.1.dev6/audyn/utils/github/__init__.py +133 -0
  164. audyn-0.0.1.dev6/audyn/utils/hydra/utils.py +515 -0
  165. audyn-0.0.1.dev6/audyn/utils/lab/__init__.py +17 -0
  166. audyn-0.0.1.dev6/audyn/utils/model/__init__.py +68 -0
  167. audyn-0.0.1.dev6/audyn/utils/music/__init__.py +66 -0
  168. audyn-0.0.1.dev6/audyn/utils/text/__init__.py +272 -0
  169. audyn-0.0.1.dev6/audyn/utils/text/indexing.py +22 -0
  170. audyn-0.0.1.dev6/audyn/utils/text/normalization.py +22 -0
  171. audyn-0.0.1.dev6/audyn/utils/text/pronunciation.py +49 -0
  172. audyn-0.0.1.dev6/audyn/utils/text/tokenization.py +57 -0
  173. audyn-0.0.1.dev6/cpp_extensions/monotonic_align/monotonic_align.cpp +96 -0
  174. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/pyproject.toml +18 -1
  175. audyn-0.0.1.dev6/setup.py +149 -0
  176. Audyn-0.0.1.dev1/Audyn.egg-info/SOURCES.txt +0 -65
  177. Audyn-0.0.1.dev1/README.md +0 -31
  178. Audyn-0.0.1.dev1/audyn/__init__.py +0 -19
  179. Audyn-0.0.1.dev1/audyn/criterion/gan.py +0 -9
  180. Audyn-0.0.1.dev1/audyn/models/__init__.py +0 -12
  181. Audyn-0.0.1.dev1/audyn/models/glowtts.py +0 -675
  182. Audyn-0.0.1.dev1/audyn/modules/positional_encoding.py +0 -58
  183. Audyn-0.0.1.dev1/audyn/optim/lr_scheduler.py +0 -38
  184. Audyn-0.0.1.dev1/audyn/optim/optimizer.py +0 -295
  185. Audyn-0.0.1.dev1/audyn/utils/__init__.py +0 -41
  186. Audyn-0.0.1.dev1/audyn/utils/alignment/monotonic_align.py +0 -26
  187. Audyn-0.0.1.dev1/audyn/utils/data/cmudict/__init__.py +0 -92
  188. Audyn-0.0.1.dev1/audyn/utils/data/dataset.py +0 -62
  189. Audyn-0.0.1.dev1/audyn/utils/data/postprocess.py +0 -231
  190. Audyn-0.0.1.dev1/audyn/utils/driver/base.py +0 -1568
  191. Audyn-0.0.1.dev1/audyn/utils/driver/text_to_feat.py +0 -31
  192. Audyn-0.0.1.dev1/audyn/utils/hydra/utils.py +0 -104
  193. Audyn-0.0.1.dev1/audyn/utils/model/__init__.py +0 -21
  194. Audyn-0.0.1.dev1/cpp_extensions/monotonic_align/monotonic_align.cpp +0 -108
  195. Audyn-0.0.1.dev1/setup.py +0 -32
  196. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/Audyn.egg-info/dependency_links.txt +0 -0
  197. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/Audyn.egg-info/top_level.txt +0 -0
  198. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/LICENSE +0 -0
  199. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/autoregressive.py +0 -0
  200. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/fastspeech.py +0 -0
  201. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/criterion/lsgan.py +0 -0
  202. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/models/gan.py +0 -0
  203. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/film.py +0 -0
  204. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/modules/normalization.py +0 -0
  205. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/data/distributed.py +0 -0
  206. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/driver/_decorator.py +0 -0
  207. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/hydra/__init__.py +0 -0
  208. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/logging/__init__.py +0 -0
  209. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/parallel/__init__.py +0 -0
  210. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/tensorboard/__init__.py +0 -0
  211. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/audyn/utils/textgrid/__init__.py +0 -0
  212. {Audyn-0.0.1.dev1 → audyn-0.0.1.dev6}/setup.cfg +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: Audyn
3
- Version: 0.0.1.dev1
3
+ Version: 0.0.1.dev6
4
4
  Summary: A PyTorch toolkit for audio synthesis.
5
5
  Author: Takuya Hasumi
6
6
  License: Apache License
@@ -209,6 +209,7 @@ Project-URL: url, https://github.com/tky823/Audyn
209
209
  Requires-Python: <4,>=3.8
210
210
  Description-Content-Type: text/markdown
211
211
  License-File: LICENSE
212
+ Requires-Dist: importlib_resources<6.2; python_version == "3.8"
212
213
  Requires-Dist: omegaconf
213
214
  Requires-Dist: hydra-core
214
215
  Requires-Dist: matplotlib
@@ -217,17 +218,27 @@ Requires-Dist: torchaudio
217
218
  Requires-Dist: torchtext
218
219
  Requires-Dist: torchvision
219
220
  Requires-Dist: tensorboard
221
+ Requires-Dist: webdataset
222
+ Requires-Dist: inflect
220
223
  Provides-Extra: recipes
221
224
  Requires-Dist: tqdm; extra == "recipes"
222
225
  Provides-Extra: dev
223
226
  Requires-Dist: flake8; extra == "dev"
224
227
  Requires-Dist: black; extra == "dev"
225
228
  Requires-Dist: isort; extra == "dev"
229
+ Provides-Extra: docs
230
+ Requires-Dist: sphinx; extra == "docs"
231
+ Requires-Dist: sphinx-autodoc-typehints; extra == "docs"
232
+ Requires-Dist: sphinx-autobuild; extra == "docs"
233
+ Requires-Dist: nbsphinx; extra == "docs"
234
+ Requires-Dist: furo; extra == "docs"
226
235
  Provides-Extra: tests
227
236
  Requires-Dist: pytest; extra == "tests"
228
237
  Requires-Dist: pytest-cov; extra == "tests"
229
238
 
230
239
  # Audyn
240
+ [![codecov](https://codecov.io/gh/tky823/Audyn/graph/badge.svg?token=7R29QDGXLQ)](https://codecov.io/gh/tky823/Audyn)
241
+
231
242
  Audyn is a PyTorch toolkit for audio synthesis.
232
243
 
233
244
  ## Installation
@@ -248,12 +259,43 @@ If you need to run recipes, add `[recipes]` as follows:
248
259
  pip install -e ".[recipes]"
249
260
  ```
250
261
 
262
+ If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build the C++-related modules.
263
+
264
+ ### C++ extension
265
+ We use [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search monotonic alignment in some models (e.g. GlowTTS).
266
+ To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
267
+
268
+ ```shell
269
+ # In Audyn/
270
+ export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
271
+ export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
272
+ pip install -e "."
273
+ ```
274
+
251
275
  ## Development
252
276
  ```shell
253
277
  # In Audyn/
254
278
  pip install -e ".[recipes,dev,tests]"
255
279
  ```
256
280
 
281
+ ## Build Documentation Locally (optional)
282
+ To build the documentation locally, you have to include `docs` when installing `Audyn`.
283
+ ```shell
284
+ pip install -e ".[docs]"
285
+ ```
286
+
287
+ When you build the documentation, run the following command.
288
+ ```shell
289
+ cd docs/
290
+ make html
291
+ ```
292
+
293
+ Or, you can build the documentation automatically using `sphinx-autobuild`.
294
+ ```shell
295
+ # in Audyn/
296
+ sphinx-autobuild docs docs/_build/html
297
+ ```
298
+
257
299
  ## Test
258
300
  ```shell
259
301
  pytest tests/package
@@ -0,0 +1,190 @@
1
+ LICENSE
2
+ MANIFEST.in
3
+ README.md
4
+ pyproject.toml
5
+ setup.py
6
+ Audyn.egg-info/PKG-INFO
7
+ Audyn.egg-info/SOURCES.txt
8
+ Audyn.egg-info/dependency_links.txt
9
+ Audyn.egg-info/requires.txt
10
+ Audyn.egg-info/top_level.txt
11
+ audyn/__init__.py
12
+ audyn/criterion/__init__.py
13
+ audyn/criterion/autoregressive.py
14
+ audyn/criterion/base.py
15
+ audyn/criterion/contrastive.py
16
+ audyn/criterion/distance.py
17
+ audyn/criterion/fastspeech.py
18
+ audyn/criterion/flow.py
19
+ audyn/criterion/gan.py
20
+ audyn/criterion/glowtts.py
21
+ audyn/criterion/hifigan.py
22
+ audyn/criterion/lsgan.py
23
+ audyn/criterion/melspectrogram.py
24
+ audyn/criterion/rvqvae.py
25
+ audyn/criterion/ssast.py
26
+ audyn/criterion/vqvae.py
27
+ audyn/functional/__init__.py
28
+ audyn/functional/activation.py
29
+ audyn/functional/clustering.py
30
+ audyn/functional/vector_quantization.py
31
+ audyn/metrics/__init__.py
32
+ audyn/metrics/base.py
33
+ audyn/metrics/crossmodal.py
34
+ audyn/metrics/retrieval.py
35
+ audyn/models/__init__.py
36
+ audyn/models/ast.py
37
+ audyn/models/encodec.py
38
+ audyn/models/fastspeech.py
39
+ audyn/models/gan.py
40
+ audyn/models/glowtts.py
41
+ audyn/models/hifigan.py
42
+ audyn/models/lextransformer.py
43
+ audyn/models/passt.py
44
+ audyn/models/pixelsnail.py
45
+ audyn/models/roformer.py
46
+ audyn/models/rvqvae.py
47
+ audyn/models/soundstream.py
48
+ audyn/models/ssast.py
49
+ audyn/models/text_to_wave.py
50
+ audyn/models/vae.py
51
+ audyn/models/vqvae.py
52
+ audyn/models/waveglow.py
53
+ audyn/models/wavenet.py
54
+ audyn/modules/activation.py
55
+ audyn/modules/duration_predictor.py
56
+ audyn/modules/encodec.py
57
+ audyn/modules/fastspeech.py
58
+ audyn/modules/film.py
59
+ audyn/modules/flow.py
60
+ audyn/modules/glow.py
61
+ audyn/modules/glowtts.py
62
+ audyn/modules/normalization.py
63
+ audyn/modules/passt.py
64
+ audyn/modules/pixelcnn.py
65
+ audyn/modules/pixelsnail.py
66
+ audyn/modules/positional_encoding.py
67
+ audyn/modules/rvq.py
68
+ audyn/modules/soundstream.py
69
+ audyn/modules/vit.py
70
+ audyn/modules/vq.py
71
+ audyn/modules/vqvae.py
72
+ audyn/modules/waveglow.py
73
+ audyn/modules/wavenet.py
74
+ audyn/optim/lr_scheduler.py
75
+ audyn/optim/optimizer.py
76
+ audyn/transforms/__init__.py
77
+ audyn/transforms/ast.py
78
+ audyn/transforms/birdclef.py
79
+ audyn/transforms/cqt.py
80
+ audyn/transforms/hifigan.py
81
+ audyn/transforms/hubert.py
82
+ audyn/transforms/kaldi.py
83
+ audyn/transforms/librosa.py
84
+ audyn/utils/__init__.py
85
+ audyn/utils/clip_grad.py
86
+ audyn/utils/alignment/__init__.py
87
+ audyn/utils/alignment/monotonic_align.py
88
+ audyn/utils/data/__init__.py
89
+ audyn/utils/data/collator.py
90
+ audyn/utils/data/composer.py
91
+ audyn/utils/data/dataloader.py
92
+ audyn/utils/data/dataset.py
93
+ audyn/utils/data/distributed.py
94
+ audyn/utils/data/postprocess.py
95
+ audyn/utils/data/sampler.py
96
+ audyn/utils/data/webdataset.py
97
+ audyn/utils/data/audioset/__init__.py
98
+ audyn/utils/data/audioset/_download.py
99
+ audyn/utils/data/audioset/ast.py
100
+ audyn/utils/data/audioset/composer.py
101
+ audyn/utils/data/audioset/dataset.py
102
+ audyn/utils/data/audioset/distributed.py
103
+ audyn/utils/data/audioset/sampler.py
104
+ audyn/utils/data/birdclef/birdclef2024/__init__.py
105
+ audyn/utils/data/birdclef/birdclef2024/_download.py
106
+ audyn/utils/data/birdclef/birdclef2024/collator.py
107
+ audyn/utils/data/birdclef/birdclef2024/composer.py
108
+ audyn/utils/data/birdclef/birdclef2024/dataset.py
109
+ audyn/utils/data/birdclef/birdclef2024/models/baseline.py
110
+ audyn/utils/data/clotho/__init__.py
111
+ audyn/utils/data/clotho/text/indexing.py
112
+ audyn/utils/data/clotho/text/normalization.py
113
+ audyn/utils/data/clotho/text/symbols.py
114
+ audyn/utils/data/clotho/text/tokenization.py
115
+ audyn/utils/data/cmudict/__init__.py
116
+ audyn/utils/data/cmudict/indexing.py
117
+ audyn/utils/data/tacotron/__init__.py
118
+ audyn/utils/data/tacotron/text/indexing.py
119
+ audyn/utils/data/tacotron/text/normalization.py
120
+ audyn/utils/data/tacotron/text/numbers.py
121
+ audyn/utils/data/tacotron/text/symbols.py
122
+ audyn/utils/data/tacotron/text/tokenization.py
123
+ audyn/utils/distributed/__init__.py
124
+ audyn/utils/driver/__init__.py
125
+ audyn/utils/driver/_decorator.py
126
+ audyn/utils/driver/base.py
127
+ audyn/utils/driver/feat_to_wave.py
128
+ audyn/utils/driver/gan.py
129
+ audyn/utils/driver/text_to_feat.py
130
+ audyn/utils/driver/text_to_wave.py
131
+ audyn/utils/driver/_conf_template/config.yaml
132
+ audyn/utils/driver/_conf_template/criterion/cross_entropy.yaml
133
+ audyn/utils/driver/_conf_template/criterion/vqvae.yaml
134
+ audyn/utils/driver/_conf_template/data/defaults.yaml
135
+ audyn/utils/driver/_conf_template/lr_scheduler/defaults.yaml
136
+ audyn/utils/driver/_conf_template/lr_scheduler/none.yaml
137
+ audyn/utils/driver/_conf_template/lr_scheduler/transformer.yaml
138
+ audyn/utils/driver/_conf_template/model/defaults.yaml
139
+ audyn/utils/driver/_conf_template/model/gan.yaml
140
+ audyn/utils/driver/_conf_template/optimizer/adam.yaml
141
+ audyn/utils/driver/_conf_template/optimizer/adam_ema.yaml
142
+ audyn/utils/driver/_conf_template/optimizer/adamw.yaml
143
+ audyn/utils/driver/_conf_template/optimizer/gan.yaml
144
+ audyn/utils/driver/_conf_template/preprocess/defaults.yaml
145
+ audyn/utils/driver/_conf_template/preprocess/ljspeech_text-to-feat.yaml
146
+ audyn/utils/driver/_conf_template/preprocess/text-to-feat.yaml
147
+ audyn/utils/driver/_conf_template/preprocess/text-to-wave.yaml
148
+ audyn/utils/driver/_conf_template/system/cpu.yaml
149
+ audyn/utils/driver/_conf_template/system/cuda.yaml
150
+ audyn/utils/driver/_conf_template/system/cuda_amp.yaml
151
+ audyn/utils/driver/_conf_template/system/cuda_ddp.yaml
152
+ audyn/utils/driver/_conf_template/system/cuda_ddp_amp.yaml
153
+ audyn/utils/driver/_conf_template/system/defaults.yaml
154
+ audyn/utils/driver/_conf_template/system/mps.yaml
155
+ audyn/utils/driver/_conf_template/test/defaults.yaml
156
+ audyn/utils/driver/_conf_template/test/text_to_wave.yaml
157
+ audyn/utils/driver/_conf_template/test/dataloader/defaults.yaml
158
+ audyn/utils/driver/_conf_template/test/dataset/defaults.yaml
159
+ audyn/utils/driver/_conf_template/test/dataset/torch.yaml
160
+ audyn/utils/driver/_conf_template/train/defaults.yaml
161
+ audyn/utils/driver/_conf_template/train/gan.yaml
162
+ audyn/utils/driver/_conf_template/train/template.yaml
163
+ audyn/utils/driver/_conf_template/train/text-to-feat+pretrained_feat-to-wave.yaml
164
+ audyn/utils/driver/_conf_template/train/clip_gradient/defaults.yaml
165
+ audyn/utils/driver/_conf_template/train/clip_gradient/gan.yaml
166
+ audyn/utils/driver/_conf_template/train/dataloader/defaults.yaml
167
+ audyn/utils/driver/_conf_template/train/dataloader/sequential-batch.yaml
168
+ audyn/utils/driver/_conf_template/train/dataset/defaults.yaml
169
+ audyn/utils/driver/_conf_template/train/dataset/sortable-torch.yaml
170
+ audyn/utils/driver/_conf_template/train/dataset/torch.yaml
171
+ audyn/utils/driver/_conf_template/train/dataset/webdataset.yaml
172
+ audyn/utils/driver/_conf_template/train/record/defaults.yaml
173
+ audyn/utils/driver/_conf_template/train/record/template.yaml
174
+ audyn/utils/duration/__init__.py
175
+ audyn/utils/github/__init__.py
176
+ audyn/utils/hydra/__init__.py
177
+ audyn/utils/hydra/utils.py
178
+ audyn/utils/lab/__init__.py
179
+ audyn/utils/logging/__init__.py
180
+ audyn/utils/model/__init__.py
181
+ audyn/utils/music/__init__.py
182
+ audyn/utils/parallel/__init__.py
183
+ audyn/utils/tensorboard/__init__.py
184
+ audyn/utils/text/__init__.py
185
+ audyn/utils/text/indexing.py
186
+ audyn/utils/text/normalization.py
187
+ audyn/utils/text/pronunciation.py
188
+ audyn/utils/text/tokenization.py
189
+ audyn/utils/textgrid/__init__.py
190
+ cpp_extensions/monotonic_align/monotonic_align.cpp
@@ -6,12 +6,24 @@ torchaudio
6
6
  torchtext
7
7
  torchvision
8
8
  tensorboard
9
+ webdataset
10
+ inflect
11
+
12
+ [:python_version == "3.8"]
13
+ importlib_resources<6.2
9
14
 
10
15
  [dev]
11
16
  flake8
12
17
  black
13
18
  isort
14
19
 
20
+ [docs]
21
+ sphinx
22
+ sphinx-autodoc-typehints
23
+ sphinx-autobuild
24
+ nbsphinx
25
+ furo
26
+
15
27
  [recipes]
16
28
  tqdm
17
29
 
@@ -1,6 +1,7 @@
1
1
  exclude .gitignore
2
- exclude *.yaml
3
2
  recursive-include audyn *.py
3
+ recursive-include audyn *.yaml
4
4
  prune .github
5
+ prune docs
5
6
  prune tests
6
7
  prune recipes
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: Audyn
3
- Version: 0.0.1.dev1
3
+ Version: 0.0.1.dev6
4
4
  Summary: A PyTorch toolkit for audio synthesis.
5
5
  Author: Takuya Hasumi
6
6
  License: Apache License
@@ -209,6 +209,7 @@ Project-URL: url, https://github.com/tky823/Audyn
209
209
  Requires-Python: <4,>=3.8
210
210
  Description-Content-Type: text/markdown
211
211
  License-File: LICENSE
212
+ Requires-Dist: importlib_resources<6.2; python_version == "3.8"
212
213
  Requires-Dist: omegaconf
213
214
  Requires-Dist: hydra-core
214
215
  Requires-Dist: matplotlib
@@ -217,17 +218,27 @@ Requires-Dist: torchaudio
217
218
  Requires-Dist: torchtext
218
219
  Requires-Dist: torchvision
219
220
  Requires-Dist: tensorboard
221
+ Requires-Dist: webdataset
222
+ Requires-Dist: inflect
220
223
  Provides-Extra: recipes
221
224
  Requires-Dist: tqdm; extra == "recipes"
222
225
  Provides-Extra: dev
223
226
  Requires-Dist: flake8; extra == "dev"
224
227
  Requires-Dist: black; extra == "dev"
225
228
  Requires-Dist: isort; extra == "dev"
229
+ Provides-Extra: docs
230
+ Requires-Dist: sphinx; extra == "docs"
231
+ Requires-Dist: sphinx-autodoc-typehints; extra == "docs"
232
+ Requires-Dist: sphinx-autobuild; extra == "docs"
233
+ Requires-Dist: nbsphinx; extra == "docs"
234
+ Requires-Dist: furo; extra == "docs"
226
235
  Provides-Extra: tests
227
236
  Requires-Dist: pytest; extra == "tests"
228
237
  Requires-Dist: pytest-cov; extra == "tests"
229
238
 
230
239
  # Audyn
240
+ [![codecov](https://codecov.io/gh/tky823/Audyn/graph/badge.svg?token=7R29QDGXLQ)](https://codecov.io/gh/tky823/Audyn)
241
+
231
242
  Audyn is a PyTorch toolkit for audio synthesis.
232
243
 
233
244
  ## Installation
@@ -248,12 +259,43 @@ If you need to run recipes, add `[recipes]` as follows:
248
259
  pip install -e ".[recipes]"
249
260
  ```
250
261
 
262
+ If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build the C++-related modules.
263
+
264
+ ### C++ extension
265
+ We use [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search monotonic alignment in some models (e.g. GlowTTS).
266
+ To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
267
+
268
+ ```shell
269
+ # In Audyn/
270
+ export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
271
+ export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
272
+ pip install -e "."
273
+ ```
274
+
251
275
  ## Development
252
276
  ```shell
253
277
  # In Audyn/
254
278
  pip install -e ".[recipes,dev,tests]"
255
279
  ```
256
280
 
281
+ ## Build Documentation Locally (optional)
282
+ To build the documentation locally, you have to include `docs` when installing `Audyn`.
283
+ ```shell
284
+ pip install -e ".[docs]"
285
+ ```
286
+
287
+ When you build the documentation, run the following command.
288
+ ```shell
289
+ cd docs/
290
+ make html
291
+ ```
292
+
293
+ Or, you can build the documentation automatically using `sphinx-autobuild`.
294
+ ```shell
295
+ # in Audyn/
296
+ sphinx-autobuild docs docs/_build/html
297
+ ```
298
+
257
299
  ## Test
258
300
  ```shell
259
301
  pytest tests/package
@@ -0,0 +1,64 @@
1
+ # Audyn
2
+ [![codecov](https://codecov.io/gh/tky823/Audyn/graph/badge.svg?token=7R29QDGXLQ)](https://codecov.io/gh/tky823/Audyn)
3
+
4
+ Audyn is a PyTorch toolkit for audio synthesis.
5
+
6
+ ## Installation
7
+ You can install by pip.
8
+ ```shell
9
+ pip install git+https://github.com/tky823/Audyn.git
10
+ ```
11
+ or clone this repository.
12
+ ```shell
13
+ git clone https://github.com/tky823/Audyn.git
14
+ cd Audyn
15
+ pip install -e .
16
+ ```
17
+
18
+ If you need to run recipes, add `[recipes]` as follows:
19
+ ```shell
20
+ # In Audyn/
21
+ pip install -e ".[recipes]"
22
+ ```
23
+
24
+ If you use macOS, you may need to set `MACOSX_DEPLOYMENT_TARGET` during installation to build the C++-related modules.
25
+
26
+ ### C++ extension
27
+ We use [C++ extension](https://pytorch.org/tutorials/advanced/cpp_extension.html) to search monotonic alignment in some models (e.g. GlowTTS).
28
+ To take full advantage of computational efficiency, set appropriate values for `OMP_NUM_THREADS` and `CXX` during installation:
29
+
30
+ ```shell
31
+ # In Audyn/
32
+ export CXX=<PATH/TO/CPP/COMPILER> # e.g. /usr/bin/c++
33
+ export OMP_NUM_THREADS=<SUITABLE/VALUE/FOR/ENVIRONMENT>
34
+ pip install -e "."
35
+ ```
36
+
37
+ ## Development
38
+ ```shell
39
+ # In Audyn/
40
+ pip install -e ".[recipes,dev,tests]"
41
+ ```
42
+
43
+ ## Build Documentation Locally (optional)
44
+ To build the documentation locally, you have to include `docs` when installing `Audyn`.
45
+ ```shell
46
+ pip install -e ".[docs]"
47
+ ```
48
+
49
+ When you build the documentation, run the following command.
50
+ ```shell
51
+ cd docs/
52
+ make html
53
+ ```
54
+
55
+ Or, you can build the documentation automatically using `sphinx-autobuild`.
56
+ ```shell
57
+ # in Audyn/
58
+ sphinx-autobuild docs docs/_build/html
59
+ ```
60
+
61
+ ## Test
62
+ ```shell
63
+ pytest tests/package
64
+ ```
@@ -0,0 +1,61 @@
1
+ import importlib
2
+ import operator
3
+ import re
4
+ from typing import Any
5
+
6
+ from omegaconf import OmegaConf
7
+
8
+ from .utils.hydra import main
9
+
10
+ __all__ = ["__version__", "main"]
11
+
12
+ __version__ = "0.0.1.dev6"
13
+
14
+ # for resolver
15
+ _whitespace_re = re.compile(r"\s+")
16
+ _int_re = re.compile(r"^\d+$")
17
+ _float_re = re.compile(r"^[0-9]*\.?[0-9]+([eE][-+]?[0-9]+)?$")
18
+
19
+
20
+ def _constant_resolver(full_var_name: str) -> Any:
21
+ if "+" in full_var_name:
22
+ # TODO: generalize
23
+ # to support whitespace, e.g. ${const:audyn.utils.data.clotho.vocab_size + 1}
24
+ full_var_names = full_var_name.split("+")
25
+ resolved = _resolve(full_var_names[0])
26
+
27
+ for _full_var_name in full_var_names[1:]:
28
+ _full_var_name = _whitespace_re.sub("", _full_var_name)
29
+
30
+ if _int_re.match(_full_var_name):
31
+ _resolved = int(_full_var_name)
32
+ elif _float_re.match(_full_var_name):
33
+ _resolved = float(_full_var_name)
34
+ else:
35
+ raise ValueError(f"{_full_var_name} cannot be converted to int nor float.")
36
+
37
+ resolved = operator.add(resolved, _resolved)
38
+ else:
39
+ resolved = _resolve(full_var_name)
40
+
41
+ return resolved
42
+
43
+
44
+ def _resolve(full_var_name: str) -> Any:
45
+ full_var_name = full_var_name.strip()
46
+ mod_name, var_name = full_var_name.rsplit(".", maxsplit=1)
47
+
48
+ try:
49
+ resolved = getattr(importlib.import_module(mod_name), var_name)
50
+ except ModuleNotFoundError:
51
+ # TODO: generalize
52
+ attr_name = var_name
53
+ mod_name, var_name = mod_name.rsplit(".", maxsplit=1)
54
+ imported_module = importlib.import_module(mod_name)
55
+ cls = getattr(imported_module, var_name)
56
+ resolved = getattr(cls, attr_name)
57
+
58
+ return resolved
59
+
60
+
61
+ OmegaConf.register_new_resolver("const", _constant_resolver)
@@ -0,0 +1,6 @@
1
+ from .base import BaseCriterionWrapper, MultiCriteria
2
+
3
+ __all__ = [
4
+ "BaseCriterionWrapper",
5
+ "MultiCriteria",
6
+ ]
@@ -30,13 +30,13 @@ class MultiCriteria(nn.ModuleDict):
30
30
 
31
31
  Examples:
32
32
 
33
- >>> import hydra
33
+ >>> import audyn
34
34
  >>> import torch
35
35
  >>> torch.manual_seed(0)
36
36
  >>> config = {
37
- ... "_target_": "audyn.criterion.base.MultiCriteria",
37
+ ... "_target_": "audyn.criterion.MultiCriteria",
38
38
  ... "mse": {
39
- ... "_target_": "audyn.criterion.base.BaseCriterionWrapper",
39
+ ... "_target_": "audyn.criterion.BaseCriterionWrapper",
40
40
  ... "criterion": {
41
41
  ... "_target_": "torch.nn.MSELoss",
42
42
  ... "reduction": "mean",
@@ -52,7 +52,7 @@ class MultiCriteria(nn.ModuleDict):
52
52
  ... }
53
53
  ... },
54
54
  ... "mae": {
55
- ... "_target_": "audyn.criterion.base.BaseCriterionWrapper",
55
+ ... "_target_": "audyn.criterion.BaseCriterionWrapper",
56
56
  ... "criterion": {
57
57
  ... "_target_": "torch.nn.L1Loss",
58
58
  ... "reduction": "mean",
@@ -68,7 +68,7 @@ class MultiCriteria(nn.ModuleDict):
68
68
  ... }
69
69
  ... }
70
70
  >>> }
71
- >>> criterion = hydra.utils.instantiate(config)
71
+ >>> criterion = audyn.utils.instantiate_criterion(config)
72
72
  >>> y = torch.randn((4,))
73
73
  >>> t_mse = torch.randn_like(y)
74
74
  >>> t_mae = torch.randn_like(y)