rxnn 0.1.29__py3-none-any.whl → 0.1.30__py3-none-any.whl
This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
rxnn/experimental/attention.py
CHANGED
@@ -319,7 +319,7 @@ class GroupedMoeAttentionVectorized(GroupedQueryAttention):
|
|
319
319
|
head_dim = d // self.num_heads
|
320
320
|
|
321
321
|
# Process Query as in GQA
|
322
|
-
q = self.q_proj(query).view(b, t, self.num_heads, -1).transpose(1, 2)
|
322
|
+
q = self.q_proj(query).view(b, t, self.num_heads, -1).transpose(1, 2) if not skip_query_processing else query
|
323
323
|
|
324
324
|
# Key/Value MoE routing
|
325
325
|
B, S, D = key.shape
|
@@ -360,6 +360,10 @@ class GroupedMoeAttentionVectorized(GroupedQueryAttention):
|
|
360
360
|
k = k.flatten(start_dim=1, end_dim=2) # (B, H, S, head_dim)
|
361
361
|
v = v.flatten(start_dim=1, end_dim=2) # (B, H, S, head_dim)
|
362
362
|
|
363
|
+
print('q', q.size())
|
364
|
+
print('k', k.size())
|
365
|
+
print('v', v.size())
|
366
|
+
|
363
367
|
return q, k, v
|
364
368
|
|
365
369
|
|
@@ -1,6 +1,6 @@
|
|
1
1
|
rxnn/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
2
2
|
rxnn/experimental/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
3
|
-
rxnn/experimental/attention.py,sha256=
|
3
|
+
rxnn/experimental/attention.py,sha256=dOhnHYknVMiw4kIfaWo08ycz1Kl5KfFAHfZEVljs2n0,29567
|
4
4
|
rxnn/experimental/models.py,sha256=QEuFBB9iEg5AbKQLwGJkAwPjMfaVeTqazhKDWPRkm7o,4598
|
5
5
|
rxnn/experimental/moe.py,sha256=PhiaNr3FwR2Zv2a0tfj6sfZ4iyhLo3Jyp2DwXq19qZQ,7935
|
6
6
|
rxnn/memory/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
@@ -25,7 +25,7 @@ rxnn/transformers/moe.py,sha256=6Cffyo0QjmEWc4rK1ncOmLRCQbY0OpQJ4D7xH_4nTN4,4738
|
|
25
25
|
rxnn/transformers/positional.py,sha256=2l38RS0Dini3f6Z3LUHr3XwWzg1UK7fO2C6wazWDAYU,4292
|
26
26
|
rxnn/transformers/sampler.py,sha256=poWBpxg1iuK5gEJtxHkk5VVfS9V48hs2Olqdhy_Gw8c,6548
|
27
27
|
rxnn/utils.py,sha256=d5U8i5ukovgDyqiycc2AoxObTz_eF_bgo2MKvdtJ98s,467
|
28
|
-
rxnn-0.1.
|
29
|
-
rxnn-0.1.
|
30
|
-
rxnn-0.1.
|
31
|
-
rxnn-0.1.
|
28
|
+
rxnn-0.1.30.dist-info/LICENSE,sha256=C8coDFIUYuOcke4JLPwTqahQUCyXyGq6WOaigOkx8tY,11275
|
29
|
+
rxnn-0.1.30.dist-info/METADATA,sha256=E5ScN8-I6sP22N80oe7QhLeszz6w9L3UcBN2GCTfu7Q,16627
|
30
|
+
rxnn-0.1.30.dist-info/WHEEL,sha256=fGIA9gx4Qxk2KDKeNJCbOEwSrmLtjWCwzBz351GyrPQ,88
|
31
|
+
rxnn-0.1.30.dist-info/RECORD,,
|
File without changes
|
File without changes
|