rxnn 0.2.41__tar.gz → 0.2.42__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39)
  1. {rxnn-0.2.41 → rxnn-0.2.42}/PKG-INFO +1 -1
  2. {rxnn-0.2.41 → rxnn-0.2.42}/pyproject.toml +1 -1
  3. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/mrl.py +2 -2
  4. {rxnn-0.2.41 → rxnn-0.2.42}/LICENSE +0 -0
  5. {rxnn-0.2.41 → rxnn-0.2.42}/README.md +0 -0
  6. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/.DS_Store +0 -0
  7. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/__init__.py +0 -0
  8. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/experimental/__init__.py +0 -0
  9. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/experimental/attention.py +0 -0
  10. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/experimental/models.py +0 -0
  11. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/experimental/moe.py +0 -0
  12. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/memory/__init__.py +0 -0
  13. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/memory/attention.py +0 -0
  14. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/memory/norm.py +0 -0
  15. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/memory/stm.py +0 -0
  16. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/rxt/__init__.py +0 -0
  17. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/rxt/models.py +0 -0
  18. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/__init__.py +0 -0
  19. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/base.py +0 -0
  20. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/bml.py +0 -0
  21. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/callbacks.py +0 -0
  22. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/dataset.py +0 -0
  23. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/ddp.py +0 -0
  24. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/models.py +0 -0
  25. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/reward.py +0 -0
  26. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/rl.py +0 -0
  27. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/scheduler.py +0 -0
  28. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/tokenizer.py +0 -0
  29. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/training/utils.py +0 -0
  30. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/__init__.py +0 -0
  31. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/attention.py +0 -0
  32. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/ff.py +0 -0
  33. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/layers.py +0 -0
  34. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/mask.py +0 -0
  35. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/models.py +0 -0
  36. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/moe.py +0 -0
  37. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/positional.py +0 -0
  38. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/transformers/sampler.py +0 -0
  39. {rxnn-0.2.41 → rxnn-0.2.42}/src/rxnn/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: rxnn
3
- Version: 0.2.41
3
+ Version: 0.2.42
4
4
  Summary: RxNN: Reactive Neural Networks Platform
5
5
  License: Apache-2.0
6
6
  Keywords: deep-learning,ai,machine-learning
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
4
4
 
5
5
  [tool.poetry]
6
6
  name = "rxnn"
7
- version = "0.2.41"
7
+ version = "0.2.42"
8
8
  description = "RxNN: Reactive Neural Networks Platform"
9
9
 
10
10
  license = "Apache-2.0"
@@ -1022,7 +1022,7 @@ class MRLTrainer:
1022
1022
 
1023
1023
  return (epochs, unfreeze_epoch), (random_resets, random_resets_from, random_resets_ratio)
1024
1024
 
1025
- def __call__(self, curriculum_config: list[CurriculumConfig], batch_size: int):
1025
+ def __call__(self, curriculum_config: list[CurriculumConfig], batch_size: int, ddp_find_unused_parameters: bool = False):
1026
1026
  """Start Memory Reinforcement Learning Curriculum."""
1027
1027
 
1028
1028
  # 0. Set global epoch count for all stages
@@ -1033,7 +1033,7 @@ class MRLTrainer:
1033
1033
  if self.use_ddp:
1034
1034
  rank, world_size = get_os_ddp_config()
1035
1035
  dist.init_process_group(backend='nccl', rank=rank, world_size=world_size)
1036
- self.actor = DistributedDataParallel(self.actor, device_ids=[self.device.index])
1036
+ self.actor = DistributedDataParallel(self.actor, device_ids=[self.device.index], find_unused_parameters=ddp_find_unused_parameters)
1037
1037
  self.critic = DistributedDataParallel(self.critic, device_ids=[self.device.index])
1038
1038
 
1039
1039
  # 2. Init BatchSampler with actor model (we have to run it after DDP init)
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes