rxnn 0.1.20__tar.gz → 0.1.21__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (31)
  1. {rxnn-0.1.20 → rxnn-0.1.21}/PKG-INFO +1 -1
  2. {rxnn-0.1.20 → rxnn-0.1.21}/pyproject.toml +1 -1
  3. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/experimental/attention.py +7 -0
  4. {rxnn-0.1.20 → rxnn-0.1.21}/LICENSE +0 -0
  5. {rxnn-0.1.20 → rxnn-0.1.21}/README.md +0 -0
  6. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/__init__.py +0 -0
  7. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/experimental/__init__.py +0 -0
  8. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/experimental/models.py +0 -0
  9. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/experimental/moe.py +0 -0
  10. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/memory/__init__.py +0 -0
  11. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/memory/norm.py +0 -0
  12. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/memory/stm.py +0 -0
  13. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/rxt/__init__.py +0 -0
  14. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/rxt/models.py +0 -0
  15. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/__init__.py +0 -0
  16. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/base.py +0 -0
  17. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/bml.py +0 -0
  18. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/callbacks.py +0 -0
  19. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/dataset.py +0 -0
  20. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/scheduler.py +0 -0
  21. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/training/tokenizer.py +0 -0
  22. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/__init__.py +0 -0
  23. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/attention.py +0 -0
  24. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/ff.py +0 -0
  25. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/layers.py +0 -0
  26. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/mask.py +0 -0
  27. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/models.py +0 -0
  28. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/moe.py +0 -0
  29. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/positional.py +0 -0
  30. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/transformers/sampler.py +0 -0
  31. {rxnn-0.1.20 → rxnn-0.1.21}/src/rxnn/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: rxnn
3
- Version: 0.1.20
3
+ Version: 0.1.21
4
4
  Summary: RxNN: Reactive Neural Networks Platform
5
5
  License: Apache-2.0
6
6
  Keywords: deep-learning,ai,machine-learning
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "rxnn"
7
- version = "0.1.20"
7
+ version = "0.1.21"
8
8
  description = "RxNN: Reactive Neural Networks Platform"
9
9
 
10
10
  license = "Apache-2.0"
@@ -125,6 +125,9 @@ class GroupedMoeAttention(GroupedQueryAttention):
125
125
  k = self._process_grouped_experts(key, self.wk, self.bk, weights_k, indices_k)
126
126
  v = self._process_grouped_experts(value, self.wv, self.bv, weights_k, indices_k)
127
127
 
128
+ print('processed k', k.size())
129
+ print('processed v', v.size())
130
+
128
131
  # Expand to GQA format
129
132
  k = k.permute(0, 2, 1, 3).reshape(B, self.num_groups, S, -1)
130
133
  v = v.permute(0, 2, 1, 3).reshape(B, self.num_groups, S, -1)
@@ -138,6 +141,10 @@ class GroupedMoeAttention(GroupedQueryAttention):
138
141
  k = k.flatten(start_dim=1, end_dim=2) # (B, H, S, head_dim)
139
142
  v = v.flatten(start_dim=1, end_dim=2) # (B, H, S, head_dim)
140
143
 
144
+ print('q', q.size())
145
+ print('k', k.size())
146
+ print('v', v.size())
147
+
141
148
  return q, k, v
142
149
 
143
150
 
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes