rxnn 0.1.30__tar.gz → 0.1.31__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (31):
  1. {rxnn-0.1.30 → rxnn-0.1.31}/PKG-INFO +1 -1
  2. {rxnn-0.1.30 → rxnn-0.1.31}/pyproject.toml +1 -1
  3. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/experimental/attention.py +10 -0
  4. {rxnn-0.1.30 → rxnn-0.1.31}/LICENSE +0 -0
  5. {rxnn-0.1.30 → rxnn-0.1.31}/README.md +0 -0
  6. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/__init__.py +0 -0
  7. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/experimental/__init__.py +0 -0
  8. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/experimental/models.py +0 -0
  9. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/experimental/moe.py +0 -0
  10. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/memory/__init__.py +0 -0
  11. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/memory/norm.py +0 -0
  12. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/memory/stm.py +0 -0
  13. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/rxt/__init__.py +0 -0
  14. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/rxt/models.py +0 -0
  15. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/__init__.py +0 -0
  16. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/base.py +0 -0
  17. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/bml.py +0 -0
  18. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/callbacks.py +0 -0
  19. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/dataset.py +0 -0
  20. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/scheduler.py +0 -0
  21. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/training/tokenizer.py +0 -0
  22. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/__init__.py +0 -0
  23. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/attention.py +0 -0
  24. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/ff.py +0 -0
  25. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/layers.py +0 -0
  26. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/mask.py +0 -0
  27. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/models.py +0 -0
  28. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/moe.py +0 -0
  29. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/positional.py +0 -0
  30. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/transformers/sampler.py +0 -0
  31. {rxnn-0.1.30 → rxnn-0.1.31}/src/rxnn/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: rxnn
3
- Version: 0.1.30
3
+ Version: 0.1.31
4
4
  Summary: RxNN: Reactive Neural Networks Platform
5
5
  License: Apache-2.0
6
6
  Keywords: deep-learning,ai,machine-learning
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "rxnn"
7
- version = "0.1.30"
7
+ version = "0.1.31"
8
8
  description = "RxNN: Reactive Neural Networks Platform"
9
9
 
10
10
  license = "Apache-2.0"
@@ -337,16 +337,26 @@ class GroupedMoeAttentionVectorized(GroupedQueryAttention):
337
337
  k_all = k_all.view(B, S, self.num_experts, -1)
338
338
  v_all = v_all.view(B, S, self.num_experts, -1)
339
339
 
340
+ print('k_all', k_all.size())
341
+ print('v_all', v_all.size())
342
+
343
+
340
344
  # Gather top-k experts and weights
341
345
  # Expand indices to [B, S, num_groups, head_dim]
342
346
  expanded_indices = indices.unsqueeze(-1).expand(-1, -1, -1, k_all.size(-1))
343
347
  selected_k = torch.gather(k_all, 2, expanded_indices) # [B, S, num_groups, head_dim]
344
348
  selected_v = torch.gather(v_all, 2, expanded_indices)
345
349
 
350
+ print('selected_k', selected_k.size())
351
+ print('selected_v', selected_v.size())
352
+
346
353
  # Weighted sum
347
354
  weighted_k = (selected_k * weights).sum(dim=2) # [B, S, head_dim]
348
355
  weighted_v = (selected_v * weights).sum(dim=2)
349
356
 
357
+ print('weighted_k', weighted_k.size())
358
+ print('weighted_v', weighted_v.size())
359
+
350
360
  # Reshape to GQA format
351
361
  k = weighted_k.view(B, S, self.num_groups, -1).permute(0, 2, 1, 3) # [B, G, S, head_dim]
352
362
  v = weighted_v.view(B, S, self.num_groups, -1).permute(0, 2, 1, 3)
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes