qwen-tts: qwen_tts-0.0.5-py3-none-any.whl → qwen_tts-0.1.0-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- qwen_tts/core/models/modeling_qwen3_tts.py +8 -3
- qwen_tts/core/tokenizer_12hz/modeling_qwen3_tts_tokenizer_v2.py +4 -3
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/METADATA +7 -1
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/RECORD +8 -8
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/WHEEL +1 -1
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/entry_points.txt +0 -0
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/licenses/LICENSE +0 -0
- {qwen_tts-0.0.5.dist-info → qwen_tts-0.1.0.dist-info}/top_level.txt +0 -0
|
@@ -470,7 +470,7 @@ class Qwen3TTSPreTrainedModel(PreTrainedModel):
|
|
|
470
470
|
supports_gradient_checkpointing = True
|
|
471
471
|
_no_split_modules = ["Qwen3TTSDecoderLayer"]
|
|
472
472
|
_skip_keys_device_placement = "past_key_values"
|
|
473
|
-
|
|
473
|
+
_supports_flash_attn = True
|
|
474
474
|
_supports_sdpa = True
|
|
475
475
|
_supports_cache_class = True
|
|
476
476
|
_supports_static_cache = False
|
|
@@ -501,8 +501,7 @@ class Qwen3TTSTalkerTextPreTrainedModel(PreTrainedModel):
|
|
|
501
501
|
supports_gradient_checkpointing = True
|
|
502
502
|
_no_split_modules = []
|
|
503
503
|
_skip_keys_device_placement = ["past_key_values"]
|
|
504
|
-
|
|
505
|
-
_supports_flash_attn_2 = True
|
|
504
|
+
_supports_flash_attn = True
|
|
506
505
|
_supports_sdpa = True
|
|
507
506
|
_supports_flex_attn = True
|
|
508
507
|
_supports_cache_class = True
|
|
@@ -1869,6 +1868,11 @@ class Qwen3TTSForConditionalGeneration(Qwen3TTSPreTrainedModel, GenerationMixin)
|
|
|
1869
1868
|
weights_only=True,
|
|
1870
1869
|
**kwargs,
|
|
1871
1870
|
):
|
|
1871
|
+
# Hotfix to enable passing the correct attn implementation which is stored in the config but not in kwargs
|
|
1872
|
+
requested_attn_implementation = kwargs.pop("attn_implementation", None)
|
|
1873
|
+
if requested_attn_implementation is None and config and config._attn_implementation:
|
|
1874
|
+
requested_attn_implementation = config._attn_implementation
|
|
1875
|
+
|
|
1872
1876
|
model = super().from_pretrained(
|
|
1873
1877
|
pretrained_model_name_or_path,
|
|
1874
1878
|
*model_args,
|
|
@@ -1881,6 +1885,7 @@ class Qwen3TTSForConditionalGeneration(Qwen3TTSPreTrainedModel, GenerationMixin)
|
|
|
1881
1885
|
revision=revision,
|
|
1882
1886
|
use_safetensors=use_safetensors,
|
|
1883
1887
|
weights_only=weights_only,
|
|
1888
|
+
attn_implementation=requested_attn_implementation,
|
|
1884
1889
|
**kwargs,
|
|
1885
1890
|
)
|
|
1886
1891
|
if not local_files_only and not os.path.isdir(pretrained_model_name_or_path):
|
|
@@ -198,12 +198,13 @@ class Qwen3TTSTokenizerV2CausalTransConvNet(nn.Module):
|
|
|
198
198
|
self.conv = nn.ConvTranspose1d(in_channels, out_channels, kernel_size, stride=stride)
|
|
199
199
|
|
|
200
200
|
pad = kernel_size - stride
|
|
201
|
-
self.left_pad =
|
|
202
|
-
self.right_pad = pad
|
|
201
|
+
self.left_pad = 0
|
|
202
|
+
self.right_pad = int(pad)
|
|
203
203
|
|
|
204
204
|
def forward(self, hidden_state):
|
|
205
205
|
hidden_state = self.conv(hidden_state)
|
|
206
|
-
|
|
206
|
+
if self.right_pad > 0:
|
|
207
|
+
hidden_state = hidden_state[..., : hidden_state.shape[-1] - self.right_pad]
|
|
207
208
|
return hidden_state.contiguous()
|
|
208
209
|
|
|
209
210
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: qwen-tts
|
|
3
|
-
Version: 0.0.5
|
|
3
|
+
Version: 0.1.0
|
|
4
4
|
Summary: Qwen-TTS python package
|
|
5
5
|
Author: Alibaba Qwen Team
|
|
6
6
|
License: Apache-2.0
|
|
@@ -1380,4 +1380,10 @@ If you find our paper and code useful in your research, please consider giving a
|
|
|
1380
1380
|
}
|
|
1381
1381
|
```
|
|
1382
1382
|
|
|
1383
|
+
|
|
1384
|
+
## Star History
|
|
1385
|
+
|
|
1386
|
+
[![Star History Chart](https://api.star-history.com/svg?repos=QwenLM/Qwen3-TTS&type=Date)](https://star-history.com/#QwenLM/Qwen3-TTS&Date)
|
|
1387
|
+
|
|
1388
|
+
|
|
1383
1389
|
<br>
|
|
@@ -4,10 +4,10 @@ qwen_tts/cli/demo.py,sha256=6ijgkwdT4Fy91Tq3vZC3voGrhZVJkCdx2xXws6v81es,29160
|
|
|
4
4
|
qwen_tts/core/__init__.py,sha256=GzgNnehDttWF2TjDOdBmE2VnynElQSZ0I0IEr0OGZ54,990
|
|
5
5
|
qwen_tts/core/models/__init__.py,sha256=kX042P1-2E3nNwP9I5TVNcpBbhVpTR5QMk5KBtQCLII,807
|
|
6
6
|
qwen_tts/core/models/configuration_qwen3_tts.py,sha256=9Shn8U_eBqQW3RSGTVA85tE9CgjV9dowGR4cgME_XRg,26428
|
|
7
|
-
qwen_tts/core/models/modeling_qwen3_tts.py,sha256=
|
|
7
|
+
qwen_tts/core/models/modeling_qwen3_tts.py,sha256=JcQmVrz4EPBu9rwYOb1wg_PIz-2sOhR8QGC0JisclqA,100211
|
|
8
8
|
qwen_tts/core/models/processing_qwen3_tts.py,sha256=YUciAxiORu2mjXQMJfDyKOziSmHs-ULlfW5J54tNa80,4022
|
|
9
9
|
qwen_tts/core/tokenizer_12hz/configuration_qwen3_tts_tokenizer_v2.py,sha256=njDCQ5SwDLA2bX2jSCt0NkaKzBzT2hpv5hSh00ZTpeM,7946
|
|
10
|
-
qwen_tts/core/tokenizer_12hz/modeling_qwen3_tts_tokenizer_v2.py,sha256=
|
|
10
|
+
qwen_tts/core/tokenizer_12hz/modeling_qwen3_tts_tokenizer_v2.py,sha256=OT_C6mD12rlnjYMJqHyT_t1idNDrFieXoEttbamaSJs,40464
|
|
11
11
|
qwen_tts/core/tokenizer_25hz/configuration_qwen3_tts_tokenizer_v1.py,sha256=KPlPcV332W02XJzqACHZzKjGPS9I9IQjxDo9PK4o7wI,14494
|
|
12
12
|
qwen_tts/core/tokenizer_25hz/modeling_qwen3_tts_tokenizer_v1.py,sha256=SdXRMvkR2uW8Fa_FzvRicu3nw4FzTHnCSLkUmfxBPF0,56472
|
|
13
13
|
qwen_tts/core/tokenizer_25hz/vq/core_vq.py,sha256=01-p8A70hjNhST4QL04o8JJIhJcRffWAgZ6Ttd_zuN4,20074
|
|
@@ -16,9 +16,9 @@ qwen_tts/core/tokenizer_25hz/vq/whisper_encoder.py,sha256=oXSLNJaLqO_-v5AsSkOZlB
|
|
|
16
16
|
qwen_tts/core/tokenizer_25hz/vq/assets/mel_filters.npz,sha256=dFCucHI6XvnTQePO5ijHywF382zkLES37SvzMl8PbUw,4271
|
|
17
17
|
qwen_tts/inference/qwen3_tts_model.py,sha256=4dpFBzKFfB9f4-NuurhdsvbcakjKr_aXP0YzhOMCdeQ,37121
|
|
18
18
|
qwen_tts/inference/qwen3_tts_tokenizer.py,sha256=vX1-6_rJIGQ7QtKd932ngHJYvEBjBUSos1tCEtOyFaw,15698
|
|
19
|
-
qwen_tts-0.0.
|
|
20
|
-
qwen_tts-0.0.
|
|
21
|
-
qwen_tts-0.0.
|
|
22
|
-
qwen_tts-0.0.
|
|
23
|
-
qwen_tts-0.0.
|
|
24
|
-
qwen_tts-0.0.
|
|
19
|
+
qwen_tts-0.1.0.dist-info/licenses/LICENSE,sha256=pEpggcc6118CVbsrtcq3TvGClWWolaJOU6TxEpCrdlU,11343
|
|
20
|
+
qwen_tts-0.1.0.dist-info/METADATA,sha256=qIoqgk0JBnvOKTWCh0ijBaECdDTAJHdkf5DhQwaRTPg,61393
|
|
21
|
+
qwen_tts-0.1.0.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
|
|
22
|
+
qwen_tts-0.1.0.dist-info/entry_points.txt,sha256=hcoVetKUabLdCmu2ST4jGo8jilnoslpFzV-bxlHf0E0,57
|
|
23
|
+
qwen_tts-0.1.0.dist-info/top_level.txt,sha256=1o-44WiYkUtYVTiL9eexzyNQXK6YWCOGZltO81PUirA,9
|
|
24
|
+
qwen_tts-0.1.0.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|