agilerl 2.4.2.dev1__tar.gz → 2.4.3.dev0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (347) hide show
  1. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.pre-commit-config.yaml +3 -3
  2. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/PKG-INFO +1 -1
  3. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/base.py +1 -2
  4. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ippo.py +1 -1
  5. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/agent.py +2 -2
  6. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/pyproject.toml +1 -1
  7. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_make_evolvable.py +1 -4
  8. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_train/test_train.py +18 -6
  9. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/uv.lock +1 -1
  10. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.coveragerc +0 -0
  11. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  12. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  13. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md +0 -0
  14. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/badges/arena-github-badge.svg +0 -0
  15. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/workflows/codeql.yml +0 -0
  16. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/workflows/python-app.yml +0 -0
  17. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.gitignore +0 -0
  18. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.readthedocs.yaml +0 -0
  19. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CITATION.cff +0 -0
  20. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CODE_OF_CONDUCT.md +0 -0
  21. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CONTRIBUTING.md +0 -0
  22. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/LICENSE +0 -0
  23. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/README.md +0 -0
  24. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/__init__.py +0 -0
  25. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/__init__.py +0 -0
  26. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/bc_lm.py +0 -0
  27. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/__init__.py +0 -0
  28. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/optimizer_wrapper.py +0 -0
  29. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/registry.py +0 -0
  30. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/cqn.py +0 -0
  31. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ddpg.py +0 -0
  32. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dpo.py +0 -0
  33. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dqn.py +0 -0
  34. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dqn_rainbow.py +0 -0
  35. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/grpo.py +0 -0
  36. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ilql.py +0 -0
  37. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/maddpg.py +0 -0
  38. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/matd3.py +0 -0
  39. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/neural_ts_bandit.py +0 -0
  40. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/neural_ucb_bandit.py +0 -0
  41. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ppo.py +0 -0
  42. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/td3.py +0 -0
  43. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/__init__.py +0 -0
  44. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/data.py +0 -0
  45. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/multi_agent_replay_buffer.py +0 -0
  46. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/replay_buffer.py +0 -0
  47. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/rollout_buffer.py +0 -0
  48. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/sampler.py +0 -0
  49. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/segment_tree.py +0 -0
  50. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/__init__.py +0 -0
  51. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/language_environment.py +0 -0
  52. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/rl_data.py +0 -0
  53. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/tokenizer.py +0 -0
  54. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/torch_datasets.py +0 -0
  55. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/__init__.py +0 -0
  56. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/mutation.py +0 -0
  57. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/tournament.py +0 -0
  58. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/__init__.py +0 -0
  59. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/base.py +0 -0
  60. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/bert.py +0 -0
  61. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/cnn.py +0 -0
  62. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/configs.py +0 -0
  63. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/custom_components.py +0 -0
  64. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/dummy.py +0 -0
  65. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/gpt.py +0 -0
  66. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/lstm.py +0 -0
  67. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/mlp.py +0 -0
  68. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/multi_input.py +0 -0
  69. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/resnet.py +0 -0
  70. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/simba.py +0 -0
  71. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/__init__.py +0 -0
  72. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/actors.py +0 -0
  73. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/base.py +0 -0
  74. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/custom_modules.py +0 -0
  75. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/distributions.py +0 -0
  76. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/distributions_experimental.py +0 -0
  77. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/q_networks.py +0 -0
  78. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/value_networks.py +0 -0
  79. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/protocols.py +0 -0
  80. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/rollouts/__init__.py +0 -0
  81. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/rollouts/on_policy.py +0 -0
  82. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/__init__.py +0 -0
  83. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_bandits.py +0 -0
  84. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_llm.py +0 -0
  85. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_multi_agent_off_policy.py +0 -0
  86. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_multi_agent_on_policy.py +0 -0
  87. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_off_policy.py +0 -0
  88. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_offline.py +0 -0
  89. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_on_policy.py +0 -0
  90. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/typing.py +0 -0
  91. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/__init__.py +0 -0
  92. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/algo_utils.py +0 -0
  93. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/cache.py +0 -0
  94. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/evolvable_networks.py +0 -0
  95. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/ilql_utils.py +0 -0
  96. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/llm_utils.py +0 -0
  97. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/log_utils.py +0 -0
  98. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/minari_utils.py +0 -0
  99. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/probe_envs.py +0 -0
  100. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/probe_envs_ma.py +0 -0
  101. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/sampling_utils.py +0 -0
  102. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/torch_utils.py +0 -0
  103. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/utils.py +0 -0
  104. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/__init__.py +0 -0
  105. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/pz_async_vec_env.py +0 -0
  106. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/pz_vec_env.py +0 -0
  107. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/__init__.py +0 -0
  108. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/learning.py +0 -0
  109. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/make_evolvable.py +0 -0
  110. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/pettingzoo_wrappers.py +0 -0
  111. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/utils.py +0 -0
  112. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_bandits.py +0 -0
  113. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_dpo.py +0 -0
  114. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_grpo.py +0 -0
  115. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_off_policy.py +0 -0
  116. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_on_policy.py +0 -0
  117. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_off_policy.py +0 -0
  118. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_off_policy_distributed.py +0 -0
  119. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_offline.py +0 -0
  120. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_offline_distributed.py +0 -0
  121. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_on_policy.py +0 -0
  122. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_rainbow.py +0 -0
  123. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_recurrent.py +0 -0
  124. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_resnet.py +0 -0
  125. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_simba.py +0 -0
  126. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/configs/ds_config.json +0 -0
  127. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/make_evolvable_benchmarking.py +0 -0
  128. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/networks.py +0 -0
  129. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/accelerate/accelerate.yaml +0 -0
  130. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/accelerate/grpo_accelerate_config.yaml +0 -0
  131. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/bandit/neural_ts.yaml +0 -0
  132. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/bandit/neural_ucb.yaml +0 -0
  133. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/cqn.yaml +0 -0
  134. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg.yaml +0 -0
  135. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg_lstm.yaml +0 -0
  136. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg_simba.yaml +0 -0
  137. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dpo.yaml +0 -0
  138. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn.yaml +0 -0
  139. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn_lstm.yaml +0 -0
  140. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn_rainbow.yaml +0 -0
  141. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/grpo.yaml +0 -0
  142. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/ippo.yaml +0 -0
  143. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/ippo_pong.yaml +0 -0
  144. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/maddpg.yaml +0 -0
  145. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/matd3.yaml +0 -0
  146. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_input.yaml +0 -0
  147. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo.yaml +0 -0
  148. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo_image.yaml +0 -0
  149. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo_recurrent.yaml +0 -0
  150. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/td3.yaml +0 -0
  151. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/cartpole/cartpole_random_v1.1.0.h5 +0 -0
  152. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/cartpole/cartpole_v1.1.0.h5 +0 -0
  153. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/pendulum/pendulum_random_v1.1.0.h5 +0 -0
  154. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/pendulum/pendulum_v1.1.0.h5 +0 -0
  155. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_bandit.py +0 -0
  156. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_custom_network.py +0 -0
  157. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_multi_agent.py +0 -0
  158. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_off_policy.py +0 -0
  159. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_off_policy_distributed.py +0 -0
  160. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_offline.py +0 -0
  161. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_offline_distributed.py +0 -0
  162. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy.py +0 -0
  163. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_cartpole.py +0 -0
  164. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_memory.py +0 -0
  165. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_minigrid.py +0 -0
  166. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_cartpole.py +0 -0
  167. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_lunar_lander.py +0 -0
  168. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_lunar_lander_rnn.py +0 -0
  169. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_rnn_memory.py +0 -0
  170. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/dependabot.yml +0 -0
  171. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/Makefile +0 -0
  172. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/arena-github-badge.svg +0 -0
  173. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/css/custom.css +0 -0
  174. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/favicon.ico +0 -0
  175. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/js/expand_sidebar.js +0 -0
  176. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/logo_teal.png +0 -0
  177. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/logo_white.png +0 -0
  178. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/module.png +0 -0
  179. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/network.png +0 -0
  180. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/iris-thumbnail.png +0 -0
  181. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/pendigits-thumbnail.png +0 -0
  182. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/rainbow_performance.png +0 -0
  183. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/simba_thumbnail.png +0 -0
  184. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/base.rst +0 -0
  185. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/cql.rst +0 -0
  186. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ddpg.rst +0 -0
  187. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dpo.rst +0 -0
  188. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dqn.rst +0 -0
  189. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dqn_rainbow.rst +0 -0
  190. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/grpo.rst +0 -0
  191. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ilql.rst +0 -0
  192. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/index.rst +0 -0
  193. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ippo.rst +0 -0
  194. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/maddpg.rst +0 -0
  195. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/matd3.rst +0 -0
  196. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/neural_ts.rst +0 -0
  197. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/neural_ucb.rst +0 -0
  198. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ppo.rst +0 -0
  199. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/registry.rst +0 -0
  200. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/td3.rst +0 -0
  201. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/wrappers.rst +0 -0
  202. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/data.rst +0 -0
  203. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/index.rst +0 -0
  204. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/multi_agent_replay_buffer.rst +0 -0
  205. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/replay_buffer.rst +0 -0
  206. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/rollout_buffer.rst +0 -0
  207. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/sampler.rst +0 -0
  208. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/segment_tree.rst +0 -0
  209. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/index.rst +0 -0
  210. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/mutation.rst +0 -0
  211. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/tournament.rst +0 -0
  212. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/base.rst +0 -0
  213. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/bert.rst +0 -0
  214. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/cnn.rst +0 -0
  215. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/custom_activation.rst +0 -0
  216. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/dummy.rst +0 -0
  217. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/gpt.rst +0 -0
  218. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/index.rst +0 -0
  219. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/lstm.rst +0 -0
  220. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/mlp.rst +0 -0
  221. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/multi_input.rst +0 -0
  222. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/resnet.rst +0 -0
  223. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/simba.rst +0 -0
  224. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/actors.rst +0 -0
  225. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/base.rst +0 -0
  226. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/index.rst +0 -0
  227. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/q_networks.rst +0 -0
  228. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/value_networks.rst +0 -0
  229. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/rollouts/index.rst +0 -0
  230. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/rollouts/on_policy.rst +0 -0
  231. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/train.rst +0 -0
  232. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/algo_utils.rst +0 -0
  233. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/cache.rst +0 -0
  234. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/evolvable_networks.rst +0 -0
  235. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/ilql_utils.rst +0 -0
  236. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/index.rst +0 -0
  237. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/llm_utils.rst +0 -0
  238. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/log_utils.rst +0 -0
  239. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/minari_utils.rst +0 -0
  240. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/probe_envs.rst +0 -0
  241. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/torch_utils.rst +0 -0
  242. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/utils.rst +0 -0
  243. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/index.rst +0 -0
  244. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/petting_zoo_async_vector_env.rst +0 -0
  245. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/petting_zoo_vector_env.rst +0 -0
  246. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/agent.rst +0 -0
  247. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/index.rst +0 -0
  248. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/learning.rst +0 -0
  249. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/make_evolvable.rst +0 -0
  250. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/pettingzoo.rst +0 -0
  251. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/bandits/index.rst +0 -0
  252. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/conf.py +0 -0
  253. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/custom_algorithms/index.rst +0 -0
  254. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/debugging_rl/index.rst +0 -0
  255. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/distributed_training/index.rst +0 -0
  256. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/evo_hyperparam_opt/index.rst +0 -0
  257. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/evolvable_networks/index.rst +0 -0
  258. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/get_started/agilerl2changes.rst +0 -0
  259. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/get_started/index.rst +0 -0
  260. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/index.rst +0 -0
  261. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/llm_finetuning/index.rst +0 -0
  262. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/make.bat +0 -0
  263. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/multi_agent_training/index.rst +0 -0
  264. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/off_policy/index.rst +0 -0
  265. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/offline_training/index.rst +0 -0
  266. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/on_policy/index.rst +0 -0
  267. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/pomdp/index.rst +0 -0
  268. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/releases/index.rst +0 -0
  269. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/requirements.txt +0 -0
  270. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/pytest.ini +0 -0
  271. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/__init__.py +0 -0
  272. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/conftest.py +0 -0
  273. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/helper_functions.py +0 -0
  274. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/pz_vector_test_utils.py +0 -0
  275. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/__init__.py +0 -0
  276. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/__init__.py +0 -0
  277. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/test_neural_ts.py +0 -0
  278. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/test_neural_ucb.py +0 -0
  279. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_base.py +0 -0
  280. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bc_lm.py +0 -0
  281. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/__init__.py +0 -0
  282. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/conftest.py +0 -0
  283. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/test_dpo.py +0 -0
  284. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/test_grpo.py +0 -0
  285. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/__init__.py +0 -0
  286. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_ippo.py +0 -0
  287. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_maddpg.py +0 -0
  288. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_matd3.py +0 -0
  289. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_optimizer_wrapper.py +0 -0
  290. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_registry.py +0 -0
  291. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/__init__.py +0 -0
  292. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_cqn.py +0 -0
  293. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ddpg.py +0 -0
  294. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_dqn.py +0 -0
  295. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_dqn_rainbow.py +0 -0
  296. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ilql.py +0 -0
  297. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ppo.py +0 -0
  298. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_td3.py +0 -0
  299. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/__init__.py +0 -0
  300. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_multi_agent_replay_buffer.py +0 -0
  301. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_replay_buffer.py +0 -0
  302. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_replay_data.py +0 -0
  303. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_rollout_buffer.py +0 -0
  304. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_sampler.py +0 -0
  305. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_segment_tree.py +0 -0
  306. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_data.py +0 -0
  307. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/__init__.py +0 -0
  308. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/test_mutation.py +0 -0
  309. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/test_tournament.py +0 -0
  310. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/__init__.py +0 -0
  311. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_base.py +0 -0
  312. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_bert.py +0 -0
  313. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_cnn.py +0 -0
  314. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_custom_activation.py +0 -0
  315. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_dummy.py +0 -0
  316. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_gpt.py +0 -0
  317. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_lstm.py +0 -0
  318. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_mlp.py +0 -0
  319. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_multi_input.py +0 -0
  320. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_resnet.py +0 -0
  321. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_simba.py +0 -0
  322. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/__init__.py +0 -0
  323. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_actors.py +0 -0
  324. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_base.py +0 -0
  325. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_q_networks.py +0 -0
  326. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_value_functions.py +0 -0
  327. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_protocols.py +0 -0
  328. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_train/test_train_llm.py +0 -0
  329. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/__init__.py +0 -0
  330. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_algo_utils.py +0 -0
  331. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_cache.py +0 -0
  332. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_ilql_utils.py +0 -0
  333. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_llm_utils.py +0 -0
  334. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_log_utils.py +0 -0
  335. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_minari_utils.py +0 -0
  336. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_probe_envs.py +0 -0
  337. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_probe_envs_ma.py +0 -0
  338. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_sampling_utils.py +0 -0
  339. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_torch_utils.py +0 -0
  340. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_utils.py +0 -0
  341. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_utils_evolvable.py +0 -0
  342. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_vector/test_vector.py +0 -0
  343. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/__init__.py +0 -0
  344. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_agent.py +0 -0
  345. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_autoreset.py +0 -0
  346. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_bandit_env.py +0 -0
  347. {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_skills.py +0 -0
@@ -24,7 +24,7 @@ repos:
24
24
  - id: mixed-line-ending
25
25
  args: [--fix=lf]
26
26
  - repo: https://github.com/psf/black-pre-commit-mirror
27
- rev: 25.12.0
27
+ rev: 26.1.0
28
28
  hooks:
29
29
  - id: black
30
30
  - repo: https://github.com/codespell-project/codespell
@@ -35,7 +35,7 @@ repos:
35
35
  - --skip=*.css,*.js,*.map,*.scss,*.svg
36
36
  - --ignore-words-list=magent,pres,roate
37
37
  - repo: https://github.com/astral-sh/ruff-pre-commit
38
- rev: v0.14.9
38
+ rev: v0.14.14
39
39
  hooks:
40
40
  - id: ruff-check
41
41
  args:
@@ -53,6 +53,6 @@ repos:
53
53
  - id: yamlfmt
54
54
  - repo: https://github.com/astral-sh/uv-pre-commit
55
55
  # uv version.
56
- rev: 0.9.27
56
+ rev: 0.9.28
57
57
  hooks:
58
58
  - id: uv-lock
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: agilerl
3
- Version: 2.4.2.dev1
3
+ Version: 2.4.3.dev0
4
4
  Summary: AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps.
5
5
  Author-email: Nick Ustaran-Anderegg <dev@agilerl.com>
6
6
  License-Expression: Apache-2.0
@@ -2066,8 +2066,7 @@ class LLMAlgorithm(EvolvableAlgorithm, ABC):
2066
2066
  accelerator: Optional[Accelerator] = None,
2067
2067
  ) -> None:
2068
2068
  raise NotImplementedError(
2069
- "The load class method is not supported for this algorithm class."
2070
- """
2069
+ "The load class method is not supported for this algorithm class." """
2071
2070
  To load a saved LLM, please load the model as follows, and then re-instantiate the GRPO
2072
2071
  class, using the pre-trained model.
2073
2072
 
@@ -671,7 +671,7 @@ class IPPO(MultiAgentRLAlgorithm):
671
671
  :param action_space: Action space for the agent
672
672
  :type action_space: gymnasium.spaces
673
673
  """
674
- (states, actions, log_probs, rewards, dones, values, next_state, next_done) = (
674
+ states, actions, log_probs, rewards, dones, values, next_state, next_done = (
675
675
  experiences
676
676
  )
677
677
 
@@ -597,8 +597,8 @@ class AsyncAgentsWrapper(AgentWrapper[MultiAgentRLAlgorithm]):
597
597
  :return: Learning information
598
598
  :rtype: Any
599
599
  """
600
- (states, actions, log_probs, rewards, dones, values, next_state, next_done) = (
601
- map(self.stack_experiences, experiences)
600
+ states, actions, log_probs, rewards, dones, values, next_state, next_done = map(
601
+ self.stack_experiences, experiences
602
602
  )
603
603
 
604
604
  # Handle case where we haven't collected a next state for each sub-agent
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "agilerl"
3
- version = "2.4.2.dev1"
3
+ version = "2.4.3.dev0"
4
4
  description = "AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps."
5
5
  authors = [{ name = "Nick Ustaran-Anderegg", email = "dev@agilerl.com" }]
6
6
  license = "Apache-2.0"
@@ -194,9 +194,7 @@ def test_instantiation_with_rainbow():
194
194
  network, input_tensor, support=support, rainbow=True
195
195
  )
196
196
  assert isinstance(evolvable_network, MakeEvolvable)
197
- assert (
198
- str(evolvable_network)
199
- == """MakeEvolvable(
197
+ assert str(evolvable_network) == """MakeEvolvable(
200
198
  (feature_net): Sequential(
201
199
  (feature_linear_layer_0): Linear(in_features=3, out_features=128, bias=True)
202
200
  (feature_activation_0): ReLU()
@@ -212,7 +210,6 @@ def test_instantiation_with_rainbow():
212
210
  (advantage_linear_layer_output): NoisyLinear(in_features=8, out_features=102)
213
211
  )
214
212
  )"""
215
- )
216
213
  del network, evolvable_network
217
214
 
218
215
 
@@ -1498,8 +1498,10 @@ def test_train_off_policy_agent_calls_made_rainbow(
1498
1498
  def test_train_off_policy_save_elite_warning(
1499
1499
  env, population_off_policy, tournament, mutations, memory
1500
1500
  ):
1501
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
1501
+ warning_string = (
1502
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
1502
1503
  be saved unless 'save_elite' is set to True."
1504
+ )
1503
1505
  with pytest.warns(match=warning_string):
1504
1506
  pop, pop_fitnesses = train_off_policy(
1505
1507
  env,
@@ -2137,8 +2139,10 @@ def test_train_on_policy_save_elite_warning(
2137
2139
  tournament,
2138
2140
  mutations,
2139
2141
  ):
2140
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2142
+ warning_string = (
2143
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2141
2144
  be saved unless 'save_elite' is set to True."
2145
+ )
2142
2146
  with pytest.warns(match=warning_string):
2143
2147
  pop, pop_fitnesses = train_on_policy(
2144
2148
  env,
@@ -2703,8 +2707,10 @@ def test_train_multi_agent_on_policy_rgb_vectorized(
2703
2707
  def test_train_multi_save_elite_warning(
2704
2708
  multi_env, population_multi_agent, on_policy, multi_memory, tournament, mutations
2705
2709
  ):
2706
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2710
+ warning_string = (
2711
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2707
2712
  be saved unless 'save_elite' is set to True."
2713
+ )
2708
2714
  with pytest.warns(match=warning_string):
2709
2715
  pop, pop_fitnesses = train_multi_agent_off_policy(
2710
2716
  multi_env,
@@ -2730,8 +2736,10 @@ def test_train_multi_save_elite_warning(
2730
2736
  def test_train_multi_save_elite_warning_on_policy(
2731
2737
  multi_env, population_multi_agent, on_policy, multi_memory, tournament, mutations
2732
2738
  ):
2733
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2739
+ warning_string = (
2740
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
2734
2741
  be saved unless 'save_elite' is set to True."
2742
+ )
2735
2743
  with pytest.warns(match=warning_string):
2736
2744
  pop, pop_fitnesses = train_multi_agent_on_policy(
2737
2745
  multi_env,
@@ -3567,8 +3575,10 @@ def test_train_offline_save_elite_warning(
3567
3575
  offline_init_hp,
3568
3576
  dummy_h5py_data,
3569
3577
  ):
3570
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
3578
+ warning_string = (
3579
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
3571
3580
  be saved unless 'save_elite' is set to True."
3581
+ )
3572
3582
  with pytest.warns(match=warning_string):
3573
3583
  pop, pop_fitness = train_offline(
3574
3584
  env,
@@ -4057,8 +4067,10 @@ def test_train_bandit_agent_calls_made(
4057
4067
  def test_train_bandit_save_elite_warning(
4058
4068
  bandit_env, population_bandit, tournament, mutations, bandit_memory
4059
4069
  ):
4060
- warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
4070
+ warning_string = (
4071
+ "'save_elite' set to False but 'elite_path' has been defined, elite will not\
4061
4072
  be saved unless 'save_elite' is set to True."
4073
+ )
4062
4074
  with pytest.warns(match=warning_string):
4063
4075
  pop, pop_fitnesses = train_bandits(
4064
4076
  bandit_env,
@@ -53,7 +53,7 @@ wheels = [
53
53
 
54
54
  [[package]]
55
55
  name = "agilerl"
56
- version = "2.4.2.dev1"
56
+ version = "2.4.3.dev0"
57
57
  source = { editable = "." }
58
58
  dependencies = [
59
59
  { name = "accelerate" },
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes