agilerl 2.5.0.dev2__tar.gz → 2.5.0.dev4__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.pre-commit-config.yaml +2 -2
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/PKG-INFO +1 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/base.py +4 -5
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/maddpg.py +1 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/matd3.py +1 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/algo_utils.py +17 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/maddpg.yaml +2 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/pyproject.toml +1 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/uv.lock +1 -1
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/ISSUE_TEMPLATE/bug_report.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/ISSUE_TEMPLATE/feature_request.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/badges/arena-github-badge.svg +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/workflows/codeql.yml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/workflows/python-app.yml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.gitignore +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.readthedocs.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CITATION.cff +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CODE_OF_CONDUCT.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/CONTRIBUTING.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/LICENSE +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/README.md +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/bc_lm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/optimizer_wrapper.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/core/registry.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/cqn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ddpg.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dqn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/dqn_rainbow.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/grpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ilql.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ippo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/neural_ts_bandit.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/neural_ucb_bandit.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/ppo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/algorithms/td3.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/data.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/multi_agent_replay_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/replay_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/rollout_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/sampler.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/components/segment_tree.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/language_environment.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/rl_data.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/tokenizer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/data/torch_datasets.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/mutation.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/hpo/tournament.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/base.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/bert.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/cnn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/configs.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/custom_components.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/dummy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/gpt.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/lstm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/mlp.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/multi_input.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/resnet.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/modules/simba.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/actors.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/base.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/custom_modules.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/distributions.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/q_networks.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/networks/value_networks.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/protocols.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/rollouts/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/rollouts/on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_bandits.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_llm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_multi_agent_off_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_multi_agent_on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_off_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_offline.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/training/train_on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/typing.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/cache.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/evolvable_networks.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/ilql_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/llm_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/log_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/minari_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/probe_envs.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/probe_envs_ma.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/sampling_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/torch_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/utils/utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/pz_async_vec_env.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/vector/pz_vec_env.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/agent.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/learning.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/make_evolvable.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/pettingzoo_wrappers.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/agilerl/wrappers/utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_bandits.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_dpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_grpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_off_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_off_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_off_policy_distributed.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_offline.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_offline_distributed.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_rainbow.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_recurrent.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_resnet.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_simba.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/configs/ds_config.json +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/make_evolvable_benchmarking.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/networks.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/accelerate/accelerate.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/accelerate/grpo_accelerate_config.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/bandit/neural_ts.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/bandit/neural_ucb.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/cqn.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg_lstm.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ddpg/ddpg_simba.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dpo.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn_lstm.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/dqn/dqn_rainbow.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/grpo.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/ippo.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/ippo_pong.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_agent/matd3.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/multi_input.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo_image.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/ppo/ppo_recurrent.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/configs/training/td3.yaml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/cartpole/cartpole_random_v1.1.0.h5 +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/cartpole/cartpole_v1.1.0.h5 +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/pendulum/pendulum_random_v1.1.0.h5 +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/data/pendulum/pendulum_v1.1.0.h5 +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_bandit.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_custom_network.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_multi_agent.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_off_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_off_policy_distributed.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_offline.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_offline_distributed.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_cartpole.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_memory.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/demo_on_policy_rnn_minigrid.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_cartpole.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_lunar_lander.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_lunar_lander_rnn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/demos/performance_flamegraph_rnn_memory.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/dependabot.yml +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/Makefile +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/arena-github-badge.svg +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/css/custom.css +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/favicon.ico +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/js/expand_sidebar.js +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/logo_teal.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/logo_white.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/module.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/network.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/iris-thumbnail.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/pendigits-thumbnail.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/rainbow_performance.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/_static/thumbnails/simba_thumbnail.png +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/base.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/cql.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ddpg.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dpo.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dqn.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/dqn_rainbow.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/grpo.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ilql.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ippo.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/maddpg.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/matd3.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/neural_ts.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/neural_ucb.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/ppo.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/registry.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/td3.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/algorithms/wrappers.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/data.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/multi_agent_replay_buffer.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/replay_buffer.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/rollout_buffer.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/sampler.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/components/segment_tree.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/mutation.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/hpo/tournament.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/base.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/bert.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/cnn.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/custom_activation.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/dummy.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/gpt.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/lstm.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/mlp.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/multi_input.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/resnet.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/modules/simba.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/actors.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/base.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/q_networks.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/networks/value_networks.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/rollouts/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/rollouts/on_policy.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/train.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/algo_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/cache.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/evolvable_networks.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/ilql_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/llm_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/log_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/minari_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/probe_envs.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/torch_utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/utils/utils.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/petting_zoo_async_vector_env.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/vector/petting_zoo_vector_env.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/agent.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/learning.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/make_evolvable.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/api/wrappers/pettingzoo.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/bandits/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/conf.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/custom_algorithms/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/debugging_rl/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/distributed_training/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/evo_hyperparam_opt/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/evolvable_networks/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/get_started/agilerl2changes.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/get_started/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/llm_finetuning/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/make.bat +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/multi_agent_training/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/off_policy/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/offline_training/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/on_policy/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/pomdp/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/releases/index.rst +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/docs/requirements.txt +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/sitecustomize.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/conftest.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/helper_functions.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/pz_vector_test_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/subprocess_runner.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/test_neural_ts.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bandits/test_neural_ucb.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_base.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_bc_lm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/conftest.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/test_dpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_llms/test_grpo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_ippo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_maddpg.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_multi_agent/test_matd3.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_optimizer_wrapper.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_registry.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_cqn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ddpg.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_dqn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_dqn_rainbow.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ilql.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_ppo.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_algorithms/test_single_agent/test_td3.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_multi_agent_replay_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_replay_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_replay_data.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_rollout_buffer.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_sampler.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_components/test_segment_tree.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_data.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/test_mutation.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_hpo/test_tournament.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_base.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_bert.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_cnn.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_custom_activation.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_dummy.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_gpt.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_lstm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_make_evolvable.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_mlp.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_multi_input.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_resnet.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_modules/test_simba.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_actors.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_base.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_distributions.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_q_networks.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_networks/test_value_functions.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_protocols.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_train/test_train.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_train/test_train_llm.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_algo_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_cache.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_ilql_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_llm_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_log_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_minari_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_probe_envs.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_probe_envs_ma.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_sampling_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_torch_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_utils.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_utils/test_utils_evolvable.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_vector/test_vector.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/__init__.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_agent.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_autoreset.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_bandit_env.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/test_wrappers/test_skills.py +0 -0
- {agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/tests/utils.py +0 -0
|
@@ -31,7 +31,7 @@ repos:
|
|
|
31
31
|
- --skip=*.css,*.js,*.map,*.scss,*.svg
|
|
32
32
|
- --ignore-words-list=magent,pres,roate
|
|
33
33
|
- repo: https://github.com/astral-sh/ruff-pre-commit
|
|
34
|
-
rev: v0.15.
|
|
34
|
+
rev: v0.15.2
|
|
35
35
|
hooks:
|
|
36
36
|
- id: ruff
|
|
37
37
|
name: Ruff Linter
|
|
@@ -46,6 +46,6 @@ repos:
|
|
|
46
46
|
|
|
47
47
|
- repo: https://github.com/astral-sh/uv-pre-commit
|
|
48
48
|
# uv version.
|
|
49
|
-
rev: 0.10.
|
|
49
|
+
rev: 0.10.4
|
|
50
50
|
hooks:
|
|
51
51
|
- id: uv-lock
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: agilerl
|
|
3
|
-
Version: 2.5.0.dev2
|
|
3
|
+
Version: 2.5.0.dev4
|
|
4
4
|
Summary: AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps.
|
|
5
5
|
Author-email: Nick Ustaran-Anderegg <dev@agilerl.com>
|
|
6
6
|
License-Expression: Apache-2.0
|
|
@@ -77,6 +77,7 @@ from agilerl.utils.algo_utils import (
|
|
|
77
77
|
chkpt_attribute_to_device,
|
|
78
78
|
clone_llm,
|
|
79
79
|
create_warmup_cosine_scheduler,
|
|
80
|
+
filter_init_dict,
|
|
80
81
|
get_input_size_from_space,
|
|
81
82
|
get_output_size_from_space,
|
|
82
83
|
isroutine,
|
|
@@ -1094,22 +1095,20 @@ class EvolvableAlgorithm(ABC, metaclass=RegistryMeta):
|
|
|
1094
1095
|
)
|
|
1095
1096
|
if isinstance(module_cls, dict):
|
|
1096
1097
|
for agent_id, mod_cls in module_cls.items():
|
|
1097
|
-
d = init_dict[agent_id]
|
|
1098
|
+
d = filter_init_dict(init_dict[agent_id], mod_cls)
|
|
1098
1099
|
d["device"] = device
|
|
1099
1100
|
mod: EvolvableModule = mod_cls(**d)
|
|
1100
1101
|
loaded_modules[name][agent_id] = mod
|
|
1101
1102
|
else:
|
|
1103
|
+
init_dict = filter_init_dict(init_dict, module_cls)
|
|
1102
1104
|
init_dict["device"] = device
|
|
1103
1105
|
module = module_cls(**init_dict)
|
|
1104
1106
|
loaded_modules[name] = module
|
|
1105
1107
|
|
|
1106
1108
|
# Reconstruct the algorithm
|
|
1107
|
-
constructor_params = inspect.signature(cls.__init__).parameters.keys()
|
|
1108
1109
|
checkpoint["accelerator"] = accelerator
|
|
1109
1110
|
checkpoint["device"] = device
|
|
1110
|
-
class_init_dict = {
|
|
1111
|
-
k: v for k, v in checkpoint.items() if k in constructor_params
|
|
1112
|
-
}
|
|
1111
|
+
class_init_dict = filter_init_dict(checkpoint, cls)
|
|
1113
1112
|
self = cls(**class_init_dict)
|
|
1114
1113
|
registry: MutationRegistry = checkpoint["registry"]
|
|
1115
1114
|
self.registry = registry
|
|
@@ -452,6 +452,21 @@ def chkpt_attribute_to_device(
|
|
|
452
452
|
return chkpt_dict
|
|
453
453
|
|
|
454
454
|
|
|
455
|
+
def filter_init_dict(init_dict: dict[str, Any], cls: type) -> dict[str, Any]:
|
|
456
|
+
"""Filter the init dict to only include parameters that are valid for the given class.
|
|
457
|
+
|
|
458
|
+
:param init_dict: Initialization dictionary
|
|
459
|
+
:type init_dict: dict[str, Any]
|
|
460
|
+
:param cls: Class to filter the init dict for
|
|
461
|
+
:type cls: type
|
|
462
|
+
|
|
463
|
+
:return: Filtered initialization dictionary
|
|
464
|
+
:rtype: dict[str, Any]
|
|
465
|
+
"""
|
|
466
|
+
init_params = inspect.signature(cls.__init__).parameters.keys()
|
|
467
|
+
return {k: v for k, v in init_dict.items() if k in init_params}
|
|
468
|
+
|
|
469
|
+
|
|
455
470
|
def key_in_nested_dict(nested_dict: dict[str, Any], target: str) -> bool:
|
|
456
471
|
"""Determine if key is in nested dictionary.
|
|
457
472
|
|
|
@@ -584,6 +599,8 @@ def format_shared_critic_encoder(encoder_configs: NetConfigType) -> dict[str, An
|
|
|
584
599
|
if encoder_key == "mlp_config":
|
|
585
600
|
encoder_config[encoder_key] = config
|
|
586
601
|
encoder_config["latent_dim"] = config.get("hidden_size", [32])[-1]
|
|
602
|
+
encoder_config["min_latent_dim"] = config.get("min_mlp_nodes", 8)
|
|
603
|
+
encoder_config["max_latent_dim"] = config.get("max_mlp_nodes", 1024)
|
|
587
604
|
else:
|
|
588
605
|
encoder_config["init_dicts"][encoder_key] = config
|
|
589
606
|
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "agilerl"
|
|
3
3
|
|
|
4
|
-
version = "2.5.0.dev2"
|
|
4
|
+
version = "2.5.0.dev4"
|
|
5
5
|
description = "AgileRL is a deep reinforcement learning library focused on improving RL development through RLOps."
|
|
6
6
|
authors = [{ name = "Nick Ustaran-Anderegg", email = "dev@agilerl.com" }]
|
|
7
7
|
license = "Apache-2.0"
|
|
File without changes
|
|
File without changes
|
{agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/.github/PULL_REQUEST_TEMPLATE/pull_request_template.md
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_off_policy.py
RENAMED
|
File without changes
|
{agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_multi_agent_on_policy.py
RENAMED
|
File without changes
|
|
File without changes
|
{agilerl-2.5.0.dev2 → agilerl-2.5.0.dev4}/benchmarking/benchmarking_off_policy_distributed.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|