rxnn 0.2.64__tar.gz → 0.2.66__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39)
  1. {rxnn-0.2.64 → rxnn-0.2.66}/PKG-INFO +1 -1
  2. {rxnn-0.2.64 → rxnn-0.2.66}/pyproject.toml +1 -1
  3. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/rxt/models.py +2 -1
  4. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/utils.py +5 -1
  5. {rxnn-0.2.64 → rxnn-0.2.66}/LICENSE +0 -0
  6. {rxnn-0.2.64 → rxnn-0.2.66}/README.md +0 -0
  7. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/.DS_Store +0 -0
  8. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/__init__.py +0 -0
  9. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/experimental/__init__.py +0 -0
  10. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/experimental/attention.py +0 -0
  11. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/experimental/models.py +0 -0
  12. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/experimental/moe.py +0 -0
  13. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/memory/__init__.py +0 -0
  14. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/memory/attention.py +0 -0
  15. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/memory/norm.py +0 -0
  16. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/memory/stm.py +0 -0
  17. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/rxt/__init__.py +0 -0
  18. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/__init__.py +0 -0
  19. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/base.py +0 -0
  20. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/bml.py +0 -0
  21. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/callbacks.py +0 -0
  22. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/dataset.py +0 -0
  23. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/ddp.py +0 -0
  24. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/models.py +0 -0
  25. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/mrl.py +0 -0
  26. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/reward.py +0 -0
  27. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/rl.py +0 -0
  28. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/scheduler.py +0 -0
  29. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/training/tokenizer.py +0 -0
  30. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/__init__.py +0 -0
  31. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/attention.py +0 -0
  32. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/ff.py +0 -0
  33. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/layers.py +0 -0
  34. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/mask.py +0 -0
  35. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/models.py +0 -0
  36. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/moe.py +0 -0
  37. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/positional.py +0 -0
  38. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/transformers/sampler.py +0 -0
  39. {rxnn-0.2.64 → rxnn-0.2.66}/src/rxnn/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: rxnn
3
- Version: 0.2.64
3
+ Version: 0.2.66
4
4
  Summary: RxNN: Reactive Neural Networks Platform
5
5
  License: Apache-2.0
6
6
  Keywords: deep-learning,ai,machine-learning
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "rxnn"
7
- version = "0.2.64"
7
+ version = "0.2.66"
8
8
  description = "RxNN: Reactive Neural Networks Platform"
9
9
 
10
10
  license = "Apache-2.0"
@@ -268,6 +268,7 @@ class RxTAlphaMemoryAttention(nn.Module, PyTorchModelHubMixin, license="apache-2
268
268
  residual_per_slot_gate: bool = False,
269
269
  residual_init_gate: float = 0.0,
270
270
  use_dynamic_residual_gate: bool = False,
271
+ use_tanh_residual_gate: bool = False,
271
272
  debug_mode: bool = False,
272
273
  debug_interval: int = 10,
273
274
  **kwargs,
@@ -300,7 +301,7 @@ class RxTAlphaMemoryAttention(nn.Module, PyTorchModelHubMixin, license="apache-2
300
301
  stm, attention_layers, memory_norm_layers,
301
302
  use_gated_residual=use_gated_residual, per_slot_gate=residual_per_slot_gate,
302
303
  init_gate=residual_init_gate, use_dynamic_gate=use_dynamic_residual_gate,
303
- debug_mode=debug_mode, debug_interval=debug_interval,
304
+ use_tanh_gate=use_tanh_residual_gate, debug_mode=debug_mode, debug_interval=debug_interval,
304
305
  )
305
306
 
306
307
  def freeze(self):
@@ -151,5 +151,9 @@ def get_gradient_norms(model: nn.Module):
151
151
  param_norm = p.grad.data.norm(2)
152
152
  total_norm += param_norm.item() ** 2
153
153
  total_norm = total_norm ** 0.5
154
- mean_norm = total_norm / len(grad_params)
154
+ params_len = len(grad_params)
155
+ if params_len != 0:
156
+ mean_norm = total_norm / params_len
157
+ else:
158
+ mean_norm = 0.0
155
159
  return total_norm, mean_norm
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes