rxnn 0.1.21__tar.gz → 0.1.22__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (31)
  1. {rxnn-0.1.21 → rxnn-0.1.22}/PKG-INFO +1 -1
  2. {rxnn-0.1.21 → rxnn-0.1.22}/pyproject.toml +1 -1
  3. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/experimental/attention.py +2 -1
  4. {rxnn-0.1.21 → rxnn-0.1.22}/LICENSE +0 -0
  5. {rxnn-0.1.21 → rxnn-0.1.22}/README.md +0 -0
  6. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/__init__.py +0 -0
  7. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/experimental/__init__.py +0 -0
  8. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/experimental/models.py +0 -0
  9. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/experimental/moe.py +0 -0
  10. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/memory/__init__.py +0 -0
  11. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/memory/norm.py +0 -0
  12. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/memory/stm.py +0 -0
  13. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/rxt/__init__.py +0 -0
  14. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/rxt/models.py +0 -0
  15. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/__init__.py +0 -0
  16. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/base.py +0 -0
  17. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/bml.py +0 -0
  18. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/callbacks.py +0 -0
  19. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/dataset.py +0 -0
  20. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/scheduler.py +0 -0
  21. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/training/tokenizer.py +0 -0
  22. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/__init__.py +0 -0
  23. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/attention.py +0 -0
  24. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/ff.py +0 -0
  25. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/layers.py +0 -0
  26. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/mask.py +0 -0
  27. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/models.py +0 -0
  28. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/moe.py +0 -0
  29. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/positional.py +0 -0
  30. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/transformers/sampler.py +0 -0
  31. {rxnn-0.1.21 → rxnn-0.1.22}/src/rxnn/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: rxnn
3
- Version: 0.1.21
3
+ Version: 0.1.22
4
4
  Summary: RxNN: Reactive Neural Networks Platform
5
5
  License: Apache-2.0
6
6
  Keywords: deep-learning,ai,machine-learning
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "rxnn"
7
- version = "0.1.21"
7
+ version = "0.1.22"
8
8
  description = "RxNN: Reactive Neural Networks Platform"
9
9
 
10
10
  license = "Apache-2.0"
@@ -229,11 +229,12 @@ class DeepMoeAttention(GroupedMoeAttention):
229
229
  weights_q = weights_q_flat.view(B, T, -1)
230
230
  indices_q = indices_q_flat.view(B, T, -1)
231
231
  q = self._process_grouped_experts(query, self.wq, self.bq, weights_q, indices_q)
232
+ print('processed q', q.size())
232
233
  q = q.permute(0, 2, 1, 3).reshape(B, self.num_query_groups, T, -1)
233
234
 
234
235
  # Expand query groups to match head count
235
236
  group_heads = self.num_heads // self.num_query_groups
236
- q = q.unsqueeze(2).expand(-1, -1, group_heads, -1, -1).flatten(1, 2).transpose(1, 2)
237
+ q = q.unsqueeze(2).expand(-1, -1, group_heads, -1, -1).flatten(1, 2)
237
238
 
238
239
  # Key/Value processing
239
240
  return super()._forward_qkv(q, key, value, b, t, d, skip_query_processing=True)
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes