diffsynth-engine 0.6.1.dev1__py3-none-any.whl → 0.6.1.dev2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- diffsynth_engine/models/wan/wan_text_encoder.py +13 -13
- {diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/METADATA +1 -1
- {diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/RECORD +6 -6
- {diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/WHEEL +0 -0
- {diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/licenses/LICENSE +0 -0
- {diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/top_level.txt +0 -0
|
@@ -198,22 +198,22 @@ class WanTextEncoderStateDictConverter(StateDictConverter):
|
|
|
198
198
|
|
|
199
199
|
def _from_diffusers(self, state_dict):
|
|
200
200
|
rename_dict = {
|
|
201
|
-
"
|
|
202
|
-
"
|
|
201
|
+
"shared.weight": "token_embedding.weight",
|
|
202
|
+
"encoder.final_layer_norm.weight": "norm.weight",
|
|
203
203
|
}
|
|
204
204
|
for i in range(self.num_encoder_layers):
|
|
205
205
|
rename_dict.update(
|
|
206
206
|
{
|
|
207
|
-
f"
|
|
208
|
-
f"
|
|
209
|
-
f"
|
|
210
|
-
f"
|
|
211
|
-
f"
|
|
212
|
-
f"
|
|
213
|
-
f"
|
|
214
|
-
f"
|
|
215
|
-
f"
|
|
216
|
-
f"
|
|
207
|
+
f"encoder.block.{i}.layer.0.SelfAttention.q.weight": f"blocks.{i}.attn.q.weight",
|
|
208
|
+
f"encoder.block.{i}.layer.0.SelfAttention.k.weight": f"blocks.{i}.attn.k.weight",
|
|
209
|
+
f"encoder.block.{i}.layer.0.SelfAttention.v.weight": f"blocks.{i}.attn.v.weight",
|
|
210
|
+
f"encoder.block.{i}.layer.0.SelfAttention.o.weight": f"blocks.{i}.attn.o.weight",
|
|
211
|
+
f"encoder.block.{i}.layer.0.SelfAttention.relative_attention_bias.weight": f"blocks.{i}.pos_embedding.embedding.weight",
|
|
212
|
+
f"encoder.block.{i}.layer.0.layer_norm.weight": f"blocks.{i}.norm1.weight",
|
|
213
|
+
f"encoder.block.{i}.layer.1.DenseReluDense.wi_0.weight": f"blocks.{i}.ffn.gate.0.weight",
|
|
214
|
+
f"encoder.block.{i}.layer.1.DenseReluDense.wi_1.weight": f"blocks.{i}.ffn.fc1.weight",
|
|
215
|
+
f"encoder.block.{i}.layer.1.DenseReluDense.wo.weight": f"blocks.{i}.ffn.fc2.weight",
|
|
216
|
+
f"encoder.block.{i}.layer.1.layer_norm.weight": f"blocks.{i}.norm2.weight",
|
|
217
217
|
}
|
|
218
218
|
)
|
|
219
219
|
|
|
@@ -224,7 +224,7 @@ class WanTextEncoderStateDictConverter(StateDictConverter):
|
|
|
224
224
|
return new_state_dict
|
|
225
225
|
|
|
226
226
|
def convert(self, state_dict):
|
|
227
|
-
if "
|
|
227
|
+
if "encoder.final_layer_norm.weight" in state_dict:
|
|
228
228
|
logger.info("use diffusers format state dict")
|
|
229
229
|
return self._from_diffusers(state_dict)
|
|
230
230
|
return state_dict
|
|
@@ -136,7 +136,7 @@ diffsynth_engine/models/wan/wan_audio_encoder.py,sha256=W7sUo3Fse33MNsZTYiYYEe0Y
|
|
|
136
136
|
diffsynth_engine/models/wan/wan_dit.py,sha256=ocCAYl3xP0UdB9dhz9R1pRfBBESEHxDUu116hORe39U,20080
|
|
137
137
|
diffsynth_engine/models/wan/wan_image_encoder.py,sha256=VE7crdTxOFN2UCMN2cQlvHB9BilSbKOBQYgnXgl4E2Y,14313
|
|
138
138
|
diffsynth_engine/models/wan/wan_s2v_dit.py,sha256=sOJsSs1snI-ZGPJS8utstmgj0wcYwloyZ0C14hQHFkg,23597
|
|
139
|
-
diffsynth_engine/models/wan/wan_text_encoder.py,sha256=
|
|
139
|
+
diffsynth_engine/models/wan/wan_text_encoder.py,sha256=OERlmwOqthAFPNnnT2sXJ4OjyyRmsRLx7VGp1zlBkLU,11021
|
|
140
140
|
diffsynth_engine/models/wan/wan_vae.py,sha256=ogXrVlwmzXR4iLxjSCkBPtYW8KWebnvvd2UtPZeoziY,38853
|
|
141
141
|
diffsynth_engine/pipelines/__init__.py,sha256=jh-4LSJ0vqlXiT8BgFgRIQxuAr2atEPyHrxXWj-Ud1U,604
|
|
142
142
|
diffsynth_engine/pipelines/base.py,sha256=RTkVwWaWXr5ujqn5-UBHvdPddYwr-uvChj9-fmoXrms,13729
|
|
@@ -185,8 +185,8 @@ diffsynth_engine/utils/video.py,sha256=GoMyc2as4_VqfWX4pjQyAWh9QObsFMov42zADVZNa
|
|
|
185
185
|
diffsynth_engine/utils/memory/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
186
186
|
diffsynth_engine/utils/memory/linear_regression.py,sha256=oW_EQEw13oPoyUrxiL8A7Ksa5AuJ2ynI2qhCbfAuZbg,3930
|
|
187
187
|
diffsynth_engine/utils/memory/memory_predcit_model.py,sha256=EXprSl_zlVjgfMWNXP-iw83Ot3hyMcgYaRPv-dvyL84,3943
|
|
188
|
-
diffsynth_engine-0.6.1.
|
|
189
|
-
diffsynth_engine-0.6.1.
|
|
190
|
-
diffsynth_engine-0.6.1.
|
|
191
|
-
diffsynth_engine-0.6.1.
|
|
192
|
-
diffsynth_engine-0.6.1.
|
|
188
|
+
diffsynth_engine-0.6.1.dev2.dist-info/licenses/LICENSE,sha256=x7aBqQuVI0IYnftgoTPI_A0I_rjdjPPQkjnU6N2nikM,11346
|
|
189
|
+
diffsynth_engine-0.6.1.dev2.dist-info/METADATA,sha256=6bwBcpLV0q3yBPFYlDecEtAJP1ga-zi7u9tioW41D7k,1163
|
|
190
|
+
diffsynth_engine-0.6.1.dev2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
191
|
+
diffsynth_engine-0.6.1.dev2.dist-info/top_level.txt,sha256=6zgbiIzEHLbhgDKRyX0uBJOV3F6VnGGBRIQvSiYYn6w,17
|
|
192
|
+
diffsynth_engine-0.6.1.dev2.dist-info/RECORD,,
|
|
File without changes
|
{diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|
{diffsynth_engine-0.6.1.dev1.dist-info → diffsynth_engine-0.6.1.dev2.dist-info}/top_level.txt
RENAMED
|
File without changes
|