multi-agent-rlenv 3.6.1__tar.gz → 3.6.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/PKG-INFO +1 -1
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/pyproject.toml +1 -1
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/catalog/deepsea.py +1 -1
- multi_agent_rlenv-3.6.2/tests/test_deepsea.py +43 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/.github/workflows/ci.yaml +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/.github/workflows/docs.yaml +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/.gitignore +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/LICENSE +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/README.md +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/gym_adapter.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/pettingzoo_adapter.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/pymarl_adapter.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/smac_adapter.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/catalog/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/env_builder.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/env_pool.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/exceptions.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/mock_env.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/env.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/episode.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/observation.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/spaces.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/state.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/step.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/models/transition.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/py.typed +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/cached_property_collector.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/import_placeholders.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/schedule.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/action_randomizer.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/agent_id_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/available_actions_mask.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/available_actions_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/blind_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/centralised.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/delayed_rewards.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/last_action_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/paddings.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/penalty_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/potential_shaping.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/rlenv_wrapper.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/time_limit.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/video_recorder.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/__init__.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_adapters.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_catalog.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_episode.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_models.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_others.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_pool.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_schedules.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_serialization.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_spaces.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/test_wrappers.py +0 -0
- {multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/tests/utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: multi-agent-rlenv
|
|
3
|
-
Version: 3.6.1
|
|
3
|
+
Version: 3.6.2
|
|
4
4
|
Summary: A strongly typed Multi-Agent Reinforcement Learning framework
|
|
5
5
|
Project-URL: repository, https://github.com/yamoling/multi-agent-rlenv
|
|
6
6
|
Author-email: Yannick Molinghen <yannick.molinghen@ulb.be>
|
|
@@ -34,7 +34,7 @@ class DeepSea(MARLEnv[MultiDiscreteSpace]):
|
|
|
34
34
|
self._step_right_penalty = -0.01 / self.max_depth
|
|
35
35
|
|
|
36
36
|
def get_observation(self) -> Observation:
|
|
37
|
-
return Observation(np.array([self._row, self._col], dtype=np.float32), self.available_actions())
|
|
37
|
+
return Observation(np.array([[self._row, self._col]], dtype=np.float32), self.available_actions())
|
|
38
38
|
|
|
39
39
|
def get_state(self) -> State:
|
|
40
40
|
return State(np.array([self._row, self._col], dtype=np.float32))
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
from marlenv.catalog.deepsea import DeepSea, LEFT, RIGHT
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
def test_env():
|
|
5
|
+
env = DeepSea(20)
|
|
6
|
+
assert env.n_actions == 2
|
|
7
|
+
assert env.action_space.is_discrete
|
|
8
|
+
assert env.observation_shape == (2,)
|
|
9
|
+
assert env.n_agents == 1
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
def test_reset():
|
|
13
|
+
env = DeepSea(20)
|
|
14
|
+
obs, state = env.reset()
|
|
15
|
+
assert obs.shape == (2,)
|
|
16
|
+
assert state.shape == (2,)
|
|
17
|
+
|
|
18
|
+
assert obs.data[0][0] == 0
|
|
19
|
+
assert state.data[0] == 0
|
|
20
|
+
assert obs.data[0][1] == 0
|
|
21
|
+
assert state.data[1] == 0
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
def test_step():
|
|
25
|
+
env = DeepSea(20)
|
|
26
|
+
env.reset()
|
|
27
|
+
step = env.step([RIGHT])
|
|
28
|
+
obs = step.obs
|
|
29
|
+
assert obs.data[0][0] == 1
|
|
30
|
+
assert obs.data[0][1] == 1
|
|
31
|
+
assert step.reward.item() < 0
|
|
32
|
+
|
|
33
|
+
step = env.step([LEFT])
|
|
34
|
+
obs = step.obs
|
|
35
|
+
assert obs.data[0][0] == 2
|
|
36
|
+
assert obs.data[0][1] == 0
|
|
37
|
+
assert step.reward.item() == 0.0
|
|
38
|
+
|
|
39
|
+
step = env.step([LEFT])
|
|
40
|
+
obs = step.obs
|
|
41
|
+
assert obs.data[0][0] == 3
|
|
42
|
+
assert obs.data[0][1] == 0
|
|
43
|
+
assert step.reward.item() == 0.0
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/adapters/pettingzoo_adapter.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/cached_property_collector.py
RENAMED
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/utils/import_placeholders.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/action_randomizer.py
RENAMED
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/agent_id_wrapper.py
RENAMED
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/available_actions_mask.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/last_action_wrapper.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{multi_agent_rlenv-3.6.1 → multi_agent_rlenv-3.6.2}/src/marlenv/wrappers/potential_shaping.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|