stable-baselines3 2.3.0a5__tar.gz → 2.3.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {stable_baselines3-2.3.0a5/stable_baselines3.egg-info → stable_baselines3-2.3.2}/PKG-INFO +1 -1
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/README.md +1 -1
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/save_util.py +2 -1
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/utils.py +3 -1
- stable_baselines3-2.3.2/stable_baselines3/version.txt +1 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2/stable_baselines3.egg-info}/PKG-INFO +1 -1
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_save_load.py +14 -0
- stable_baselines3-2.3.0a5/stable_baselines3/version.txt +0 -1
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/LICENSE +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/NOTICE +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/pyproject.toml +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/setup.cfg +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/setup.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/a2c/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/a2c/a2c.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/a2c/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/atari_wrappers.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/base_class.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/buffers.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/callbacks.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/distributions.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/env_checker.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/env_util.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/bit_flipping_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/identity_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/multi_input_envs.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/evaluation.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/logger.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/monitor.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/noise.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/off_policy_algorithm.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/on_policy_algorithm.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/preprocessing.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/results_plotter.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/running_mean_std.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/sb2_compat/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/sb2_compat/rmsprop_tf_like.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/torch_layers.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/type_aliases.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/base_vec_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/dummy_vec_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/patch_gym.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/stacked_observations.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/subproc_vec_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/util.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_check_nan.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_extract_dict_obs.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_frame_stack.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_monitor.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_normalize.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_transpose.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/vec_video_recorder.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ddpg/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ddpg/ddpg.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ddpg/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/dqn/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/dqn/dqn.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/dqn/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/her/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/her/goal_selection_strategy.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/her/her_replay_buffer.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ppo/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ppo/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/ppo/ppo.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/py.typed +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/sac/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/sac/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/sac/sac.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/td3/__init__.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/td3/policies.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/td3/td3.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/SOURCES.txt +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/dependency_links.txt +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/requires.txt +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/top_level.txt +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_buffers.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_callbacks.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_cnn.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_custom_policy.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_deterministic.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_dict_env.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_distributions.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_env_checker.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_envs.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_gae.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_her.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_identity.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_logger.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_monitor.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_predict.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_preprocessing.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_run.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_sde.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_spaces.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_tensorboard.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_train_eval_mode.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_utils.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_check_nan.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_envs.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_extract_dict_obs.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_monitor.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_normalize.py +0 -0
- {stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/tests/test_vec_stacked_obs.py +0 -0
|
@@ -85,7 +85,7 @@ Documentation is available online: [https://sb3-contrib.readthedocs.io/](https:/
|
|
|
85
85
|
|
|
86
86
|
## Stable-Baselines Jax (SBX)
|
|
87
87
|
|
|
88
|
-
[Stable Baselines Jax (SBX)](https://github.com/araffin/sbx) is a proof of concept version of Stable-Baselines3 in Jax.
|
|
88
|
+
[Stable Baselines Jax (SBX)](https://github.com/araffin/sbx) is a proof of concept version of Stable-Baselines3 in Jax, with recent algorithms like DroQ or CrossQ.
|
|
89
89
|
|
|
90
90
|
It provides a minimal number of features compared to SB3 but can be much faster (up to 20 times!): https://twitter.com/araffin2/status/1590714558628253698
|
|
91
91
|
|
|
@@ -447,7 +447,8 @@ def load_from_zip_file(
|
|
|
447
447
|
file_content.seek(0)
|
|
448
448
|
# Load the parameters with the right ``map_location``.
|
|
449
449
|
# Remove ".pth" ending with splitext
|
|
450
|
-
|
|
450
|
+
# Note(antonin): we cannot use weights_only=True, as it breaks with PyTorch 1.13, see GH#1911
|
|
451
|
+
th_object = th.load(file_content, map_location=device, weights_only=False)
|
|
451
452
|
# "tensors.pth" was renamed "pytorch_variables.pth" in v0.9.0, see PR #138
|
|
452
453
|
if file_path == "pytorch_variables.pth" or file_path == "tensors.pth":
|
|
453
454
|
# PyTorch variables (not state_dicts)
|
|
@@ -92,7 +92,9 @@ def get_schedule_fn(value_schedule: Union[Schedule, float]) -> Schedule:
|
|
|
92
92
|
value_schedule = constant_fn(float(value_schedule))
|
|
93
93
|
else:
|
|
94
94
|
assert callable(value_schedule)
|
|
95
|
-
|
|
95
|
+
# Cast to float to avoid unpickling errors to enable weights_only=True, see GH#1900
|
|
96
|
+
# Some types have odd behaviors when part of a Schedule, like numpy floats
|
|
97
|
+
return lambda progress_remaining: float(value_schedule(progress_remaining))
|
|
96
98
|
|
|
97
99
|
|
|
98
100
|
def get_linear_fn(start: float, end: float, end_fraction: float) -> Schedule:
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
2.3.2
|
|
@@ -783,3 +783,17 @@ def test_no_resource_warning(tmp_path):
|
|
|
783
783
|
fp.seek(0)
|
|
784
784
|
model.load_replay_buffer(fp)
|
|
785
785
|
assert not fp.closed
|
|
786
|
+
|
|
787
|
+
|
|
788
|
+
def test_cast_lr_schedule(tmp_path):
|
|
789
|
+
# See GH#1900
|
|
790
|
+
model = PPO("MlpPolicy", "Pendulum-v1", learning_rate=lambda t: t * np.sin(1.0))
|
|
791
|
+
# Note: for recent versions of numpy, np.float64 is a subclass of float
|
|
792
|
+
# so we need to use type here
|
|
793
|
+
# assert isinstance(model.lr_schedule(1.0), float)
|
|
794
|
+
assert type(model.lr_schedule(1.0)) is float # noqa: E721
|
|
795
|
+
assert np.allclose(model.lr_schedule(0.5), 0.5 * np.sin(1.0))
|
|
796
|
+
model.save(tmp_path / "ppo.zip")
|
|
797
|
+
model = PPO.load(tmp_path / "ppo.zip")
|
|
798
|
+
assert type(model.lr_schedule(1.0)) is float # noqa: E721
|
|
799
|
+
assert np.allclose(model.lr_schedule(0.5), 0.5 * np.sin(1.0))
|
|
@@ -1 +0,0 @@
|
|
|
1
|
-
2.3.0a5
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/atari_wrappers.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/base_class.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/distributions.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/env_checker.py
RENAMED
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/envs/identity_env.py
RENAMED
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/evaluation.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/preprocessing.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/results_plotter.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/running_mean_std.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/torch_layers.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/type_aliases.py
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/patch_gym.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/common/vec_env/util.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3/her/her_replay_buffer.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/SOURCES.txt
RENAMED
|
File without changes
|
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/requires.txt
RENAMED
|
File without changes
|
{stable_baselines3-2.3.0a5 → stable_baselines3-2.3.2}/stable_baselines3.egg-info/top_level.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|