gym-examples 3.0.757__py3-none-any.whl → 3.0.759__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gym_examples/__init__.py +1 -1
- gym_examples/envs/wsn_env.py +16 -16
- {gym_examples-3.0.757.dist-info → gym_examples-3.0.759.dist-info}/METADATA +1 -1
- gym_examples-3.0.759.dist-info/RECORD +7 -0
- gym_examples-3.0.757.dist-info/RECORD +0 -7
- {gym_examples-3.0.757.dist-info → gym_examples-3.0.759.dist-info}/WHEEL +0 -0
- {gym_examples-3.0.757.dist-info → gym_examples-3.0.759.dist-info}/top_level.txt +0 -0
gym_examples/__init__.py
CHANGED
gym_examples/envs/wsn_env.py
CHANGED
@@ -51,8 +51,8 @@ class ScalarAttentionModel(nn.Module):
|
|
51
51
|
scalar_output = self.output_layer(attention_output)
|
52
52
|
return scalar_output
|
53
53
|
|
54
|
-
|
55
|
-
|
54
|
+
net = ScalarAttentionModel(input_dim)
|
55
|
+
net = net.double() # Convert the weights to Double
|
56
56
|
|
57
57
|
class WSNRoutingEnv(gym.Env):
|
58
58
|
|
@@ -212,7 +212,7 @@ class WSNRoutingEnv(gym.Env):
|
|
212
212
|
|
213
213
|
self.number_of_packets[i] = 0 # Reset the number of packets of the sensor i
|
214
214
|
# Calculate final reward
|
215
|
-
|
215
|
+
rewards[i] = self.compute_attention_rewards(rewards[i])
|
216
216
|
# rewards[i] = np.mean(rewards[i])
|
217
217
|
|
218
218
|
# Integrate the mobility of the sensors
|
@@ -226,8 +226,7 @@ class WSNRoutingEnv(gym.Env):
|
|
226
226
|
self.get_metrics()
|
227
227
|
|
228
228
|
# rewards = [reward.item() if isinstance(reward, torch.Tensor) else reward for reward in rewards] # Convert the reward to a float
|
229
|
-
rewards =
|
230
|
-
# rewards = np.mean(rewards)
|
229
|
+
rewards = np.mean(rewards)
|
231
230
|
|
232
231
|
for i in range(self.n_sensors):
|
233
232
|
if not dones[i]:
|
@@ -464,20 +463,21 @@ class WSNRoutingEnv(gym.Env):
|
|
464
463
|
return np.clip(normalized_throughput, 0, 1)
|
465
464
|
|
466
465
|
|
467
|
-
def compute_attention_rewards(self,
|
466
|
+
def compute_attention_rewards(self, reward):
    '''
    Compute the attention-based reward for a single sensor.

    The raw reward is converted to a double-precision tensor, given a
    leading batch dimension, and passed once through the module-level
    attention network `net`. The network's single output value is
    returned as a plain Python number.

    Args:
        reward: the raw reward value(s) for one sensor; anything that
            torch.tensor() accepts.
            NOTE(review): presumably a flat sequence whose length matches
            the `input_dim` the network was built with -- confirm against
            the caller in step().

    Returns:
        float: the scalar produced by `net` for this reward input.

    Raises:
        An error from Tensor.item() if `net` does not return exactly one
        element for the batched input.
    '''
    # `net` is converted to double at module level, so the input tensor
    # must use the same dtype.
    rewards_i = torch.tensor(reward, dtype=torch.double).unsqueeze(0)  # Add batch dimension

    # Only the value is needed here; run a single forward pass and skip
    # autograd bookkeeping (the result is detached by .item() anyway).
    with torch.no_grad():
        scalar_output = net(rewards_i)

    return scalar_output.item()
|
481
481
|
|
482
482
|
|
483
483
|
# def compute_attention_reward(self, rewards):
|
@@ -0,0 +1,7 @@
|
|
1
|
+
gym_examples/__init__.py,sha256=ZTeyp0SinvYP9QhqAJgRCJyDVdSqynNlieriu3lweGA,166
|
2
|
+
gym_examples/envs/__init__.py,sha256=lgMe4pyOuUTgTBUddM0iwMlETsYTwFShny6ifm8PGM8,53
|
3
|
+
gym_examples/envs/wsn_env.py,sha256=Z0W7fcJ696BlqAUnRNoZi6Qg9tJcvBhLvv_UHGCJYOs,26980
|
4
|
+
gym_examples-3.0.759.dist-info/METADATA,sha256=zC4tuoN4KrjVHrfvi5ZCP5EYKmmv5CcXRvH_jQAZCfc,412
|
5
|
+
gym_examples-3.0.759.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
|
6
|
+
gym_examples-3.0.759.dist-info/top_level.txt,sha256=rJRksoAF32M6lTLBEwYzRdo4PgtejceaNnnZ3HeY_Rk,13
|
7
|
+
gym_examples-3.0.759.dist-info/RECORD,,
|
@@ -1,7 +0,0 @@
|
|
1
|
-
gym_examples/__init__.py,sha256=wTbccbijA4S2bCClYZUAIV2wk4v8I02ORM5B8uPEouc,166
|
2
|
-
gym_examples/envs/__init__.py,sha256=lgMe4pyOuUTgTBUddM0iwMlETsYTwFShny6ifm8PGM8,53
|
3
|
-
gym_examples/envs/wsn_env.py,sha256=09K0IztE2cXxl9PChKgDaLVqPF2KNQ-Pav_h0PDdYNo,26947
|
4
|
-
gym_examples-3.0.757.dist-info/METADATA,sha256=-WQV4YWJ9pbVuWL4z_MnISbNBEm7pD-4jZjF_S-SNuA,412
|
5
|
-
gym_examples-3.0.757.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
|
6
|
-
gym_examples-3.0.757.dist-info/top_level.txt,sha256=rJRksoAF32M6lTLBEwYzRdo4PgtejceaNnnZ3HeY_Rk,13
|
7
|
-
gym_examples-3.0.757.dist-info/RECORD,,
|
File without changes
|
File without changes
|