agilerl 2.5.0.dev2__tar.gz → 2.5.0.dev4__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (349)
  1. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.pre-commit-config.yaml +2 -2
  2. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/PKG-INFO +1 -1
  3. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/base.py +4 -5
  4. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/maddpg.py +1 -1
  5. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/matd3.py +1 -1
  6. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/algo_utils.py +17 -0
  7. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/maddpg.yaml +2 -1
  8. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/pyproject.toml +1 -1
  9. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/uv.lock +1 -1
  10. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
  11. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
  12. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md +0 -0
  13. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/badges/arena-github-badge.svg +0 -0
  14. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/workflows/codeql.yml +0 -0
  15. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/workflows/python-app.yml +0 -0
  16. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.gitignore +0 -0
  17. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.readthedocs.yaml +0 -0
  18. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CITATION.cff +0 -0
  19. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CODE_OF_CONDUCT.md +0 -0
  20. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CONTRIBUTING.md +0 -0
  21. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/LICENSE +0 -0
  22. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/README.md +0 -0
  23. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/__init__.py +0 -0
  24. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/__init__.py +0 -0
  25. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/bc_lm.py +0 -0
  26. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/__init__.py +0 -0
  27. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/optimizer_wrapper.py +0 -0
  28. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/registry.py +0 -0
  29. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/cqn.py +0 -0
  30. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ddpg.py +0 -0
  31. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dpo.py +0 -0
  32. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dqn.py +0 -0
  33. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dqn_rainbow.py +0 -0
  34. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/grpo.py +0 -0
  35. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ilql.py +0 -0
  36. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ippo.py +0 -0
  37. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/neural_ts_bandit.py +0 -0
  38. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/neural_ucb_bandit.py +0 -0
  39. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ppo.py +0 -0
  40. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/td3.py +0 -0
  41. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/__init__.py +0 -0
  42. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/data.py +0 -0
  43. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/multi_agent_replay_buffer.py +0 -0
  44. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/replay_buffer.py +0 -0
  45. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/rollout_buffer.py +0 -0
  46. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/sampler.py +0 -0
  47. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/segment_tree.py +0 -0
  48. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/__init__.py +0 -0
  49. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/language_environment.py +0 -0
  50. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/rl_data.py +0 -0
  51. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/tokenizer.py +0 -0
  52. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/torch_datasets.py +0 -0
  53. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/__init__.py +0 -0
  54. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/mutation.py +0 -0
  55. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/tournament.py +0 -0
  56. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/__init__.py +0 -0
  57. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/base.py +0 -0
  58. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/bert.py +0 -0
  59. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/cnn.py +0 -0
  60. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/configs.py +0 -0
  61. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/custom_components.py +0 -0
  62. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/dummy.py +0 -0
  63. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/gpt.py +0 -0
  64. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/lstm.py +0 -0
  65. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/mlp.py +0 -0
  66. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/multi_input.py +0 -0
  67. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/resnet.py +0 -0
  68. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/simba.py +0 -0
  69. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/__init__.py +0 -0
  70. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/actors.py +0 -0
  71. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/base.py +0 -0
  72. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/custom_modules.py +0 -0
  73. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/distributions.py +0 -0
  74. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/q_networks.py +0 -0
  75. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/value_networks.py +0 -0
  76. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/protocols.py +0 -0
  77. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/rollouts/__init__.py +0 -0
  78. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/rollouts/on_policy.py +0 -0
  79. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/__init__.py +0 -0
  80. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_bandits.py +0 -0
  81. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_llm.py +0 -0
  82. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_multi_agent_off_policy.py +0 -0
  83. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_multi_agent_on_policy.py +0 -0
  84. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_off_policy.py +0 -0
  85. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_offline.py +0 -0
  86. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_on_policy.py +0 -0
  87. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/typing.py +0 -0
  88. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/__init__.py +0 -0
  89. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/cache.py +0 -0
  90. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/evolvable_networks.py +0 -0
  91. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/ilql_utils.py +0 -0
  92. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/llm_utils.py +0 -0
  93. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/log_utils.py +0 -0
  94. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/minari_utils.py +0 -0
  95. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/probe_envs.py +0 -0
  96. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/probe_envs_ma.py +0 -0
  97. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/sampling_utils.py +0 -0
  98. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/torch_utils.py +0 -0
  99. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/utils.py +0 -0
  100. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/__init__.py +0 -0
  101. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/pz_async_vec_env.py +0 -0
  102. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/pz_vec_env.py +0 -0
  103. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/__init__.py +0 -0
  104. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/agent.py +0 -0
  105. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/learning.py +0 -0
  106. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/make_evolvable.py +0 -0
  107. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/pettingzoo_wrappers.py +0 -0
  108. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/utils.py +0 -0
  109. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_bandits.py +0 -0
  110. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_dpo.py +0 -0
  111. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_grpo.py +0 -0
  112. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_off_policy.py +0 -0
  113. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_on_policy.py +0 -0
  114. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_off_policy.py +0 -0
  115. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_off_policy_distributed.py +0 -0
  116. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_offline.py +0 -0
  117. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_offline_distributed.py +0 -0
  118. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_on_policy.py +0 -0
  119. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_rainbow.py +0 -0
  120. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_recurrent.py +0 -0
  121. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_resnet.py +0 -0
  122. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_simba.py +0 -0
  123. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/configs/ds_config.json +0 -0
  124. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/make_evolvable_benchmarking.py +0 -0
  125. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/networks.py +0 -0
  126. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/accelerate/accelerate.yaml +0 -0
  127. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/accelerate/grpo_accelerate_config.yaml +0 -0
  128. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/bandit/neural_ts.yaml +0 -0
  129. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/bandit/neural_ucb.yaml +0 -0
  130. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/cqn.yaml +0 -0
  131. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg.yaml +0 -0
  132. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg_lstm.yaml +0 -0
  133. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg_simba.yaml +0 -0
  134. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dpo.yaml +0 -0
  135. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn.yaml +0 -0
  136. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn_lstm.yaml +0 -0
  137. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn_rainbow.yaml +0 -0
  138. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/grpo.yaml +0 -0
  139. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/ippo.yaml +0 -0
  140. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/ippo_pong.yaml +0 -0
  141. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/matd3.yaml +0 -0
  142. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_input.yaml +0 -0
  143. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo.yaml +0 -0
  144. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo_image.yaml +0 -0
  145. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo_recurrent.yaml +0 -0
  146. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/td3.yaml +0 -0
  147. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/cartpole/cartpole_random_v1.1.0.h5 +0 -0
  148. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/cartpole/cartpole_v1.1.0.h5 +0 -0
  149. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/pendulum/pendulum_random_v1.1.0.h5 +0 -0
  150. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/pendulum/pendulum_v1.1.0.h5 +0 -0
  151. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_bandit.py +0 -0
  152. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_custom_network.py +0 -0
  153. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_multi_agent.py +0 -0
  154. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_off_policy.py +0 -0
  155. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_off_policy_distributed.py +0 -0
  156. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_offline.py +0 -0
  157. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_offline_distributed.py +0 -0
  158. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy.py +0 -0
  159. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_cartpole.py +0 -0
  160. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_memory.py +0 -0
  161. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_minigrid.py +0 -0
  162. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_cartpole.py +0 -0
  163. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_lunar_lander.py +0 -0
  164. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_lunar_lander_rnn.py +0 -0
  165. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_rnn_memory.py +0 -0
  166. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/dependabot.yml +0 -0
  167. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/Makefile +0 -0
  168. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/__init__.py +0 -0
  169. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/arena-github-badge.svg +0 -0
  170. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/css/custom.css +0 -0
  171. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/favicon.ico +0 -0
  172. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/js/expand_sidebar.js +0 -0
  173. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/logo_teal.png +0 -0
  174. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/logo_white.png +0 -0
  175. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/module.png +0 -0
  176. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/network.png +0 -0
  177. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/iris-thumbnail.png +0 -0
  178. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/pendigits-thumbnail.png +0 -0
  179. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/rainbow_performance.png +0 -0
  180. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/simba_thumbnail.png +0 -0
  181. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/base.rst +0 -0
  182. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/cql.rst +0 -0
  183. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ddpg.rst +0 -0
  184. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dpo.rst +0 -0
  185. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dqn.rst +0 -0
  186. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dqn_rainbow.rst +0 -0
  187. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/grpo.rst +0 -0
  188. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ilql.rst +0 -0
  189. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/index.rst +0 -0
  190. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ippo.rst +0 -0
  191. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/maddpg.rst +0 -0
  192. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/matd3.rst +0 -0
  193. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/neural_ts.rst +0 -0
  194. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/neural_ucb.rst +0 -0
  195. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ppo.rst +0 -0
  196. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/registry.rst +0 -0
  197. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/td3.rst +0 -0
  198. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/wrappers.rst +0 -0
  199. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/data.rst +0 -0
  200. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/index.rst +0 -0
  201. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/multi_agent_replay_buffer.rst +0 -0
  202. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/replay_buffer.rst +0 -0
  203. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/rollout_buffer.rst +0 -0
  204. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/sampler.rst +0 -0
  205. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/segment_tree.rst +0 -0
  206. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/index.rst +0 -0
  207. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/mutation.rst +0 -0
  208. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/tournament.rst +0 -0
  209. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/base.rst +0 -0
  210. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/bert.rst +0 -0
  211. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/cnn.rst +0 -0
  212. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/custom_activation.rst +0 -0
  213. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/dummy.rst +0 -0
  214. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/gpt.rst +0 -0
  215. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/index.rst +0 -0
  216. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/lstm.rst +0 -0
  217. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/mlp.rst +0 -0
  218. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/multi_input.rst +0 -0
  219. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/resnet.rst +0 -0
  220. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/simba.rst +0 -0
  221. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/actors.rst +0 -0
  222. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/base.rst +0 -0
  223. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/index.rst +0 -0
  224. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/q_networks.rst +0 -0
  225. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/value_networks.rst +0 -0
  226. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/rollouts/index.rst +0 -0
  227. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/rollouts/on_policy.rst +0 -0
  228. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/train.rst +0 -0
  229. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/algo_utils.rst +0 -0
  230. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/cache.rst +0 -0
  231. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/evolvable_networks.rst +0 -0
  232. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/ilql_utils.rst +0 -0
  233. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/index.rst +0 -0
  234. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/llm_utils.rst +0 -0
  235. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/log_utils.rst +0 -0
  236. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/minari_utils.rst +0 -0
  237. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/probe_envs.rst +0 -0
  238. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/torch_utils.rst +0 -0
  239. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/utils.rst +0 -0
  240. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/index.rst +0 -0
  241. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/petting_zoo_async_vector_env.rst +0 -0
  242. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/petting_zoo_vector_env.rst +0 -0
  243. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/agent.rst +0 -0
  244. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/index.rst +0 -0
  245. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/learning.rst +0 -0
  246. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/make_evolvable.rst +0 -0
  247. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/pettingzoo.rst +0 -0
  248. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/bandits/index.rst +0 -0
  249. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/conf.py +0 -0
  250. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/custom_algorithms/index.rst +0 -0
  251. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/debugging_rl/index.rst +0 -0
  252. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/distributed_training/index.rst +0 -0
  253. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/evo_hyperparam_opt/index.rst +0 -0
  254. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/evolvable_networks/index.rst +0 -0
  255. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/get_started/agilerl2changes.rst +0 -0
  256. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/get_started/index.rst +0 -0
  257. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/index.rst +0 -0
  258. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/llm_finetuning/index.rst +0 -0
  259. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/make.bat +0 -0
  260. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/multi_agent_training/index.rst +0 -0
  261. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/off_policy/index.rst +0 -0
  262. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/offline_training/index.rst +0 -0
  263. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/on_policy/index.rst +0 -0
  264. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/pomdp/index.rst +0 -0
  265. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/releases/index.rst +0 -0
  266. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/requirements.txt +0 -0
  267. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/sitecustomize.py +0 -0
  268. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/__init__.py +0 -0
  269. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/conftest.py +0 -0
  270. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/helper_functions.py +0 -0
  271. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/pz_vector_test_utils.py +0 -0
  272. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/subprocess_runner.py +0 -0
  273. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/__init__.py +0 -0
  274. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/__init__.py +0 -0
  275. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/test_neural_ts.py +0 -0
  276. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/test_neural_ucb.py +0 -0
  277. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_base.py +0 -0
  278. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bc_lm.py +0 -0
  279. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/__init__.py +0 -0
  280. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/conftest.py +0 -0
  281. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/test_dpo.py +0 -0
  282. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/test_grpo.py +0 -0
  283. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/__init__.py +0 -0
  284. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_ippo.py +0 -0
  285. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_maddpg.py +0 -0
  286. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_matd3.py +0 -0
  287. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_optimizer_wrapper.py +0 -0
  288. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_registry.py +0 -0
  289. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/__init__.py +0 -0
  290. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_cqn.py +0 -0
  291. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ddpg.py +0 -0
  292. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_dqn.py +0 -0
  293. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_dqn_rainbow.py +0 -0
  294. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ilql.py +0 -0
  295. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ppo.py +0 -0
  296. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_td3.py +0 -0
  297. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/__init__.py +0 -0
  298. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_multi_agent_replay_buffer.py +0 -0
  299. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_replay_buffer.py +0 -0
  300. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_replay_data.py +0 -0
  301. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_rollout_buffer.py +0 -0
  302. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_sampler.py +0 -0
  303. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_segment_tree.py +0 -0
  304. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_data.py +0 -0
  305. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/__init__.py +0 -0
  306. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/test_mutation.py +0 -0
  307. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/test_tournament.py +0 -0
  308. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/__init__.py +0 -0
  309. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_base.py +0 -0
  310. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_bert.py +0 -0
  311. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_cnn.py +0 -0
  312. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_custom_activation.py +0 -0
  313. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_dummy.py +0 -0
  314. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_gpt.py +0 -0
  315. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_lstm.py +0 -0
  316. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_make_evolvable.py +0 -0
  317. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_mlp.py +0 -0
  318. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_multi_input.py +0 -0
  319. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_resnet.py +0 -0
  320. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_simba.py +0 -0
  321. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/__init__.py +0 -0
  322. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_actors.py +0 -0
  323. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_base.py +0 -0
  324. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_distributions.py +0 -0
  325. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_q_networks.py +0 -0
  326. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_value_functions.py +0 -0
  327. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_protocols.py +0 -0
  328. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_train/test_train.py +0 -0
  329. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_train/test_train_llm.py +0 -0
  330. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/__init__.py +0 -0
  331. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_algo_utils.py +0 -0
  332. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_cache.py +0 -0
  333. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_ilql_utils.py +0 -0
  334. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_llm_utils.py +0 -0
  335. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_log_utils.py +0 -0
  336. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_minari_utils.py +0 -0
  337. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_probe_envs.py +0 -0
  338. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_probe_envs_ma.py +0 -0
  339. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_sampling_utils.py +0 -0
  340. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_torch_utils.py +0 -0
  341. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_utils.py +0 -0
  342. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_utils_evolvable.py +0 -0
  343. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_vector/test_vector.py +0 -0
  344. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/__init__.py +0 -0
  345. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_agent.py +0 -0
  346. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_autoreset.py +0 -0
  347. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_bandit_env.py +0 -0
  348. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_skills.py +0 -0
  349. {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/utils.py +0 -0
@@ -31,7 +31,7 @@ repos:
31
31
  - --skip=*.css,*.js,*.map,*.scss,*.svg
32
32
  - --ignore-words-list=magent,pres,roate
33
33
  - repo: https://github.com/astral-sh/ruff-pre-commit
34
- rev: v0.15.1
34
+ rev: v0.15.2
35
35
  hooks:
36
36
  - id: ruff
37
37
  name: Ruff Linter
@@ -46,6 +46,6 @@ repos:
46
46
 
47
47
  - repo: https://github.com/astral-sh/uv-pre-commit
48
48
  # uv version.
49
- rev: 0.10.3
49
+ rev: 0.10.4
50
50
  hooks:
51
51
  - id: uv-lock
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: agilerl
3
- Version: 2.5.0.dev2
3
+ Version: 2.5.0.dev4
4
4
  Summary: AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps.
5
5
  Author-email: Nick Ustaran-Anderegg <dev@agilerl.com>
6
6
  License-Expression: Apache-2.0
@@ -77,6 +77,7 @@ from agilerl.utils.algo_utils import (
77
77
  chkpt_attribute_to_device,
78
78
  clone_llm,
79
79
  create_warmup_cosine_scheduler,
80
+ filter_init_dict,
80
81
  get_input_size_from_space,
81
82
  get_output_size_from_space,
82
83
  isroutine,
@@ -1094,22 +1095,20 @@ class EvolvableAlgorithm(ABC, metaclass=RegistryMeta):
1094
1095
  )
1095
1096
  if isinstance(module_cls, dict):
1096
1097
  for agent_id, mod_cls in module_cls.items():
1097
- d = init_dict[agent_id]
1098
+ d = filter_init_dict(init_dict[agent_id], mod_cls)
1098
1099
  d["device"] = device
1099
1100
  mod: EvolvableModule = mod_cls(**d)
1100
1101
  loaded_modules[name][agent_id] = mod
1101
1102
  else:
1103
+ init_dict = filter_init_dict(init_dict, module_cls)
1102
1104
  init_dict["device"] = device
1103
1105
  module = module_cls(**init_dict)
1104
1106
  loaded_modules[name] = module
1105
1107
 
1106
1108
  # Reconstruct the algorithm
1107
- constructor_params = inspect.signature(cls.__init__).parameters.keys()
1108
1109
  checkpoint["accelerator"] = accelerator
1109
1110
  checkpoint["device"] = device
1110
- class_init_dict = {
1111
- k: v for k, v in checkpoint.items() if k in constructor_params
1112
- }
1111
+ class_init_dict = filter_init_dict(checkpoint, cls)
1113
1112
  self = cls(**class_init_dict)
1114
1113
  registry: MutationRegistry = checkpoint["registry"]
1115
1114
  self.registry = registry
@@ -299,7 +299,7 @@ class MADDPG(MultiAgentRLAlgorithm):
299
299
  )
300
300
  max_latent_dim = max(
301
301
  [
302
- agent_configs[agent_id].get("max_latent_dim", 128)
302
+ agent_configs[agent_id].get("max_latent_dim", 1024)
303
303
  for agent_id in self.agent_ids
304
304
  ],
305
305
  )
@@ -337,7 +337,7 @@ class MATD3(MultiAgentRLAlgorithm):
337
337
  )
338
338
  max_latent_dim = max(
339
339
  [
340
- agent_configs[agent_id].get("max_latent_dim", 128)
340
+ agent_configs[agent_id].get("max_latent_dim", 1024)
341
341
  for agent_id in self.agent_ids
342
342
  ],
343
343
  )
@@ -452,6 +452,21 @@ def chkpt_attribute_to_device(
452
452
  return chkpt_dict
453
453
 
454
454
 
455
+ def filter_init_dict(init_dict: dict[str, Any], cls: type) -> dict[str, Any]:
456
+ """Filter the init dict to only include parameters that are valid for the given class.
457
+
458
+ :param init_dict: Initialization dictionary
459
+ :type init_dict: dict[str, Any]
460
+ :param cls: Class to filter the init dict for
461
+ :type cls: type
462
+
463
+ :return: Filtered initialization dictionary
464
+ :rtype: dict[str, Any]
465
+ """
466
+ init_params = inspect.signature(cls.__init__).parameters.keys()
467
+ return {k: v for k, v in init_dict.items() if k in init_params}
468
+
469
+
455
470
  def key_in_nested_dict(nested_dict: dict[str, Any], target: str) -> bool:
456
471
  """Determine if key is in nested dictionary.
457
472
 
@@ -584,6 +599,8 @@ def format_shared_critic_encoder(encoder_configs: NetConfigType) -> dict[str, An
584
599
  if encoder_key == "mlp_config":
585
600
  encoder_config[encoder_key] = config
586
601
  encoder_config["latent_dim"] = config.get("hidden_size", [32])[-1]
602
+ encoder_config["min_latent_dim"] = config.get("min_mlp_nodes", 8)
603
+ encoder_config["max_latent_dim"] = config.get("max_mlp_nodes", 1024)
587
604
  else:
588
605
  encoder_config["init_dicts"][encoder_key] = config
589
606
 
@@ -71,7 +71,8 @@ MUTATION_PARAMS:
71
71
 
72
72
  NET_CONFIG:
73
73
  latent_dim: 64
74
-
74
+ min_latent_dim: 8
75
+ max_latent_dim: 1024
75
76
  encoder_config:
76
77
  hidden_size: [64]
77
78
  min_mlp_nodes: 64
@@ -1,7 +1,7 @@
1
1
  [project]
2
2
  name = "agilerl"
3
3
 
4
- version = "2.5.0.dev2"
4
+ version = "2.5.0.dev4"
5
5
  description = "AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps."
6
6
  authors = [{ name = "Nick Ustaran-Anderegg", email = "dev@agilerl.com" }]
7
7
  license = "Apache-2.0"
@@ -52,7 +52,7 @@ wheels = [
52
52
 
53
53
  [[package]]
54
54
  name = "agilerl"
55
- version = "2.5.0.dev3"
55
+ version = "2.5.0.dev4"
56
56
  source = { editable = "." }
57
57
  dependencies = [
58
58
  { name = "accelerate" },
File without changes
File without changes
File without changes
File without changes
File without changes