agilerl 2.4.2.dev1__tar.gz → 2.4.3.dev0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.pre-commit-config.yaml +3 -3
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/PKG-INFO +1 -1
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/base.py +1 -2
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ippo.py +1 -1
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/agent.py +2 -2
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/pyproject.toml +1 -1
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_make_evolvable.py +1 -4
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_train/test_train.py +18 -6
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/uv.lock +1 -1
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.coveragerc +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/badges/arena-github-badge.svg +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/workflows/codeql.yml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/workflows/python-app.yml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.gitignore +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.readthedocs.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CITATION.cff +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CODE_OF_CONDUCT.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/CONTRIBUTING.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/LICENSE +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/README.md +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/bc_lm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/optimizer_wrapper.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/core/registry.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/cqn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ddpg.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dqn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/dqn_rainbow.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/grpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ilql.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/maddpg.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/matd3.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/neural_ts_bandit.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/neural_ucb_bandit.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/ppo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/algorithms/td3.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/data.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/multi_agent_replay_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/replay_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/rollout_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/sampler.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/components/segment_tree.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/language_environment.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/rl_data.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/tokenizer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/data/torch_datasets.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/mutation.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/hpo/tournament.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/base.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/bert.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/cnn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/configs.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/custom_components.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/dummy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/gpt.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/lstm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/mlp.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/multi_input.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/resnet.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/modules/simba.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/actors.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/base.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/custom_modules.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/distributions.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/distributions_experimental.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/q_networks.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/networks/value_networks.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/protocols.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/rollouts/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/rollouts/on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_bandits.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_llm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_multi_agent_off_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_multi_agent_on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_off_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_offline.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/training/train_on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/typing.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/algo_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/cache.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/evolvable_networks.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/ilql_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/llm_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/log_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/minari_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/probe_envs.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/probe_envs_ma.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/sampling_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/torch_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/utils/utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/pz_async_vec_env.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/vector/pz_vec_env.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/learning.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/make_evolvable.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/pettingzoo_wrappers.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/agilerl/wrappers/utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_bandits.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_dpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_grpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_off_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_off_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_off_policy_distributed.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_offline.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_offline_distributed.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_rainbow.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_recurrent.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_resnet.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_simba.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/configs/ds_config.json +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/make_evolvable_benchmarking.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/networks.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/accelerate/accelerate.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/accelerate/grpo_accelerate_config.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/bandit/neural_ts.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/bandit/neural_ucb.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/cqn.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg_lstm.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ddpg/ddpg_simba.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dpo.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn_lstm.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/dqn/dqn_rainbow.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/grpo.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/ippo.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/ippo_pong.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/maddpg.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_agent/matd3.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/multi_input.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo_image.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/ppo/ppo_recurrent.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/configs/training/td3.yaml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/cartpole/cartpole_random_v1.1.0.h5 +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/cartpole/cartpole_v1.1.0.h5 +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/pendulum/pendulum_random_v1.1.0.h5 +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/data/pendulum/pendulum_v1.1.0.h5 +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_bandit.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_custom_network.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_multi_agent.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_off_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_off_policy_distributed.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_offline.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_offline_distributed.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_cartpole.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_memory.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/demo_on_policy_rnn_minigrid.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_cartpole.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_lunar_lander.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_lunar_lander_rnn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/demos/performance_flamegraph_rnn_memory.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/dependabot.yml +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/Makefile +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/arena-github-badge.svg +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/css/custom.css +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/favicon.ico +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/js/expand_sidebar.js +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/logo_teal.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/logo_white.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/module.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/network.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/iris-thumbnail.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/pendigits-thumbnail.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/rainbow_performance.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/_static/thumbnails/simba_thumbnail.png +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/base.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/cql.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ddpg.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dpo.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dqn.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/dqn_rainbow.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/grpo.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ilql.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ippo.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/maddpg.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/matd3.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/neural_ts.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/neural_ucb.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/ppo.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/registry.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/td3.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/algorithms/wrappers.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/data.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/multi_agent_replay_buffer.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/replay_buffer.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/rollout_buffer.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/sampler.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/components/segment_tree.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/mutation.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/hpo/tournament.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/base.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/bert.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/cnn.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/custom_activation.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/dummy.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/gpt.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/lstm.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/mlp.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/multi_input.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/resnet.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/modules/simba.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/actors.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/base.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/q_networks.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/networks/value_networks.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/rollouts/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/rollouts/on_policy.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/train.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/algo_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/cache.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/evolvable_networks.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/ilql_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/llm_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/log_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/minari_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/probe_envs.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/torch_utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/utils/utils.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/petting_zoo_async_vector_env.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/vector/petting_zoo_vector_env.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/agent.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/learning.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/make_evolvable.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/api/wrappers/pettingzoo.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/bandits/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/conf.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/custom_algorithms/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/debugging_rl/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/distributed_training/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/evo_hyperparam_opt/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/evolvable_networks/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/get_started/agilerl2changes.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/get_started/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/llm_finetuning/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/make.bat +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/multi_agent_training/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/off_policy/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/offline_training/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/on_policy/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/pomdp/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/releases/index.rst +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/docs/requirements.txt +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/pytest.ini +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/conftest.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/helper_functions.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/pz_vector_test_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/test_neural_ts.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bandits/test_neural_ucb.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_base.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_bc_lm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/conftest.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/test_dpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_llms/test_grpo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_ippo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_maddpg.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_multi_agent/test_matd3.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_optimizer_wrapper.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_registry.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_cqn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ddpg.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_dqn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_dqn_rainbow.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ilql.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_ppo.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_algorithms/test_single_agent/test_td3.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_multi_agent_replay_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_replay_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_replay_data.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_rollout_buffer.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_sampler.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_components/test_segment_tree.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_data.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/test_mutation.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_hpo/test_tournament.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_base.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_bert.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_cnn.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_custom_activation.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_dummy.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_gpt.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_lstm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_mlp.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_multi_input.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_resnet.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_modules/test_simba.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_actors.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_base.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_q_networks.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_networks/test_value_functions.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_protocols.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_train/test_train_llm.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_algo_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_cache.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_ilql_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_llm_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_log_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_minari_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_probe_envs.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_probe_envs_ma.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_sampling_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_torch_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_utils.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_utils/test_utils_evolvable.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_vector/test_vector.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/__init__.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_agent.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_autoreset.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_bandit_env.py +0 -0
- {agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/tests/test_wrappers/test_skills.py +0 -0
|
@@ -24,7 +24,7 @@ repos:
|
|
|
24
24
|
- id: mixed-line-ending
|
|
25
25
|
args: [--fix=lf]
|
|
26
26
|
- repo: https://github.com/psf/black-pre-commit-mirror
|
|
27
|
-
rev:
|
|
27
|
+
rev: 26.1.0
|
|
28
28
|
hooks:
|
|
29
29
|
- id: black
|
|
30
30
|
- repo: https://github.com/codespell-project/codespell
|
|
@@ -35,7 +35,7 @@ repos:
|
|
|
35
35
|
- --skip=*.css,*.js,*.map,*.scss,*.svg
|
|
36
36
|
- --ignore-words-list=magent,pres,roate
|
|
37
37
|
- repo: https://github.com/astral-sh/ruff-pre-commit
|
|
38
|
-
rev: v0.14.
|
|
38
|
+
rev: v0.14.14
|
|
39
39
|
hooks:
|
|
40
40
|
- id: ruff-check
|
|
41
41
|
args:
|
|
@@ -53,6 +53,6 @@ repos:
|
|
|
53
53
|
- id: yamlfmt
|
|
54
54
|
- repo: https://github.com/astral-sh/uv-pre-commit
|
|
55
55
|
# uv version.
|
|
56
|
-
rev: 0.9.
|
|
56
|
+
rev: 0.9.28
|
|
57
57
|
hooks:
|
|
58
58
|
- id: uv-lock
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: agilerl
|
|
3
|
-
Version: 2.4.2.dev1
|
|
3
|
+
Version: 2.4.3.dev0
|
|
4
4
|
Summary: AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps.
|
|
5
5
|
Author-email: Nick Ustaran-Anderegg <dev@agilerl.com>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -2066,8 +2066,7 @@ class LLMAlgorithm(EvolvableAlgorithm, ABC):
|
|
|
2066
2066
|
accelerator: Optional[Accelerator] = None,
|
|
2067
2067
|
) -> None:
|
|
2068
2068
|
raise NotImplementedError(
|
|
2069
|
-
"The load class method is not supported for this algorithm class."
|
|
2070
|
-
"""
|
|
2069
|
+
"The load class method is not supported for this algorithm class." """
|
|
2071
2070
|
To load a saved LLM, please load the model as follows, and then re-instantiate the GRPO
|
|
2072
2071
|
class, using the pre-trained model.
|
|
2073
2072
|
|
|
@@ -671,7 +671,7 @@ class IPPO(MultiAgentRLAlgorithm):
|
|
|
671
671
|
:param action_space: Action space for the agent
|
|
672
672
|
:type action_space: gymnasium.spaces
|
|
673
673
|
"""
|
|
674
|
-
|
|
674
|
+
states, actions, log_probs, rewards, dones, values, next_state, next_done = (
|
|
675
675
|
experiences
|
|
676
676
|
)
|
|
677
677
|
|
|
@@ -597,8 +597,8 @@ class AsyncAgentsWrapper(AgentWrapper[MultiAgentRLAlgorithm]):
|
|
|
597
597
|
:return: Learning information
|
|
598
598
|
:rtype: Any
|
|
599
599
|
"""
|
|
600
|
-
|
|
601
|
-
|
|
600
|
+
states, actions, log_probs, rewards, dones, values, next_state, next_done = map(
|
|
601
|
+
self.stack_experiences, experiences
|
|
602
602
|
)
|
|
603
603
|
|
|
604
604
|
# Handle case where we haven't collected a next state for each sub-agent
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "agilerl"
|
|
3
|
-
version = "2.4.2.dev1"
|
|
3
|
+
version = "2.4.3.dev0"
|
|
4
4
|
description = "AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps."
|
|
5
5
|
authors = [{ name = "Nick Ustaran-Anderegg", email = "dev@agilerl.com" }]
|
|
6
6
|
license = "Apache-2.0"
|
|
@@ -194,9 +194,7 @@ def test_instantiation_with_rainbow():
|
|
|
194
194
|
network, input_tensor, support=support, rainbow=True
|
|
195
195
|
)
|
|
196
196
|
assert isinstance(evolvable_network, MakeEvolvable)
|
|
197
|
-
assert (
|
|
198
|
-
str(evolvable_network)
|
|
199
|
-
== """MakeEvolvable(
|
|
197
|
+
assert str(evolvable_network) == """MakeEvolvable(
|
|
200
198
|
(feature_net): Sequential(
|
|
201
199
|
(feature_linear_layer_0): Linear(in_features=3, out_features=128, bias=True)
|
|
202
200
|
(feature_activation_0): ReLU()
|
|
@@ -212,7 +210,6 @@ def test_instantiation_with_rainbow():
|
|
|
212
210
|
(advantage_linear_layer_output): NoisyLinear(in_features=8, out_features=102)
|
|
213
211
|
)
|
|
214
212
|
)"""
|
|
215
|
-
)
|
|
216
213
|
del network, evolvable_network
|
|
217
214
|
|
|
218
215
|
|
|
@@ -1498,8 +1498,10 @@ def test_train_off_policy_agent_calls_made_rainbow(
|
|
|
1498
1498
|
def test_train_off_policy_save_elite_warning(
|
|
1499
1499
|
env, population_off_policy, tournament, mutations, memory
|
|
1500
1500
|
):
|
|
1501
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
1501
|
+
warning_string = (
|
|
1502
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
1502
1503
|
be saved unless 'save_elite' is set to True."
|
|
1504
|
+
)
|
|
1503
1505
|
with pytest.warns(match=warning_string):
|
|
1504
1506
|
pop, pop_fitnesses = train_off_policy(
|
|
1505
1507
|
env,
|
|
@@ -2137,8 +2139,10 @@ def test_train_on_policy_save_elite_warning(
|
|
|
2137
2139
|
tournament,
|
|
2138
2140
|
mutations,
|
|
2139
2141
|
):
|
|
2140
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2142
|
+
warning_string = (
|
|
2143
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2141
2144
|
be saved unless 'save_elite' is set to True."
|
|
2145
|
+
)
|
|
2142
2146
|
with pytest.warns(match=warning_string):
|
|
2143
2147
|
pop, pop_fitnesses = train_on_policy(
|
|
2144
2148
|
env,
|
|
@@ -2703,8 +2707,10 @@ def test_train_multi_agent_on_policy_rgb_vectorized(
|
|
|
2703
2707
|
def test_train_multi_save_elite_warning(
|
|
2704
2708
|
multi_env, population_multi_agent, on_policy, multi_memory, tournament, mutations
|
|
2705
2709
|
):
|
|
2706
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2710
|
+
warning_string = (
|
|
2711
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2707
2712
|
be saved unless 'save_elite' is set to True."
|
|
2713
|
+
)
|
|
2708
2714
|
with pytest.warns(match=warning_string):
|
|
2709
2715
|
pop, pop_fitnesses = train_multi_agent_off_policy(
|
|
2710
2716
|
multi_env,
|
|
@@ -2730,8 +2736,10 @@ def test_train_multi_save_elite_warning(
|
|
|
2730
2736
|
def test_train_multi_save_elite_warning_on_policy(
|
|
2731
2737
|
multi_env, population_multi_agent, on_policy, multi_memory, tournament, mutations
|
|
2732
2738
|
):
|
|
2733
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2739
|
+
warning_string = (
|
|
2740
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
2734
2741
|
be saved unless 'save_elite' is set to True."
|
|
2742
|
+
)
|
|
2735
2743
|
with pytest.warns(match=warning_string):
|
|
2736
2744
|
pop, pop_fitnesses = train_multi_agent_on_policy(
|
|
2737
2745
|
multi_env,
|
|
@@ -3567,8 +3575,10 @@ def test_train_offline_save_elite_warning(
|
|
|
3567
3575
|
offline_init_hp,
|
|
3568
3576
|
dummy_h5py_data,
|
|
3569
3577
|
):
|
|
3570
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
3578
|
+
warning_string = (
|
|
3579
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
3571
3580
|
be saved unless 'save_elite' is set to True."
|
|
3581
|
+
)
|
|
3572
3582
|
with pytest.warns(match=warning_string):
|
|
3573
3583
|
pop, pop_fitness = train_offline(
|
|
3574
3584
|
env,
|
|
@@ -4057,8 +4067,10 @@ def test_train_bandit_agent_calls_made(
|
|
|
4057
4067
|
def test_train_bandit_save_elite_warning(
|
|
4058
4068
|
bandit_env, population_bandit, tournament, mutations, bandit_memory
|
|
4059
4069
|
):
|
|
4060
|
-
warning_string = "'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
4070
|
+
warning_string = (
|
|
4071
|
+
"'save_elite' set to False but 'elite_path' has been defined, elite will not\
|
|
4061
4072
|
be saved unless 'save_elite' is set to True."
|
|
4073
|
+
)
|
|
4062
4074
|
with pytest.warns(match=warning_string):
|
|
4063
4075
|
pop, pop_fitnesses = train_bandits(
|
|
4064
4076
|
bandit_env,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_off_policy.py
RENAMED
|
File without changes
|
{agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_multi_agent_on_policy.py
RENAMED
|
File without changes
|
|
File without changes
|
{agilerl-2.4.2.dev1 → agilerl-2.4.3.dev0}/benchmarking/benchmarking_off_policy_distributed.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|