gym-examples 3.0.748__py3-none-any.whl → 3.0.750__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- gym_examples/__init__.py +1 -1
- gym_examples/envs/wsn_env.py +39 -38
- {gym_examples-3.0.748.dist-info → gym_examples-3.0.750.dist-info}/METADATA +1 -1
- gym_examples-3.0.750.dist-info/RECORD +7 -0
- gym_examples-3.0.748.dist-info/RECORD +0 -7
- {gym_examples-3.0.748.dist-info → gym_examples-3.0.750.dist-info}/WHEEL +0 -0
- {gym_examples-3.0.748.dist-info → gym_examples-3.0.750.dist-info}/top_level.txt +0 -0
gym_examples/__init__.py
CHANGED
gym_examples/envs/wsn_env.py
CHANGED
@@ -150,7 +150,7 @@ class WSNRoutingEnv(gym.Env):
         self.number_of_steps += 1
         self.steps += 1
         # rewards = [-max_reward] * self.n_sensors
-        reward_init =
+        reward_init = [0] * input_dim
         rewards = [reward_init] * self.n_sensors
         dones = [False] * self.n_sensors
         for i, action in enumerate(actions):
@@ -179,7 +179,7 @@ class WSNRoutingEnv(gym.Env):
                 self.total_latency += self.packet_latency[i] + latency_per_hop
                 self.packet_latency[i] = 0

-                rewards[i] =
+                rewards[i] = [max_reward] * input_dim # Reward for transmitting data to the base station
                 dones[i] = True
             else:
                 distance = np.linalg.norm(self.sensor_positions[i] - self.sensor_positions[action])
@@ -225,10 +225,10 @@ class WSNRoutingEnv(gym.Env):

         self.get_metrics()

-        rewards = [reward.item() if isinstance(reward, torch.Tensor) else reward for reward in rewards] # Convert the reward to a float
+        # rewards = [reward.item() if isinstance(reward, torch.Tensor) else reward for reward in rewards] # Convert the reward to a float

-        rewards = self.
-        rewards = np.mean(rewards)
+        rewards = self.compute_attention_rewards(rewards)
+        # rewards = np.mean(rewards)

         for i in range(self.n_sensors):
             if not dones[i]:
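This hunk stops collapsing the per-sensor rewards with `np.mean`: each sensor now keeps a vector of reward components that is handed to the new `compute_attention_rewards` helper added further down in this diff. A minimal sketch of the shapes the change implies, assuming `input_dim` reward components per sensor; the concrete sizes below are illustrative, not taken from the package:

```python
# Sketch only: shapes inferred from the diff; the values of n_sensors and input_dim are assumptions.
import torch

n_sensors, input_dim = 10, 4
rewards = [[0.0] * input_dim for _ in range(n_sensors)]          # per-sensor reward vectors, as built from reward_init
batch = torch.tensor(rewards, dtype=torch.double).unsqueeze(0)   # shape (1, n_sensors, input_dim)
# compute_attention_rewards() forwards a tensor like `batch` through the attention
# network and returns its output in place of the scalar mean used in 3.0.748.
```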
@@ -382,7 +382,7 @@ class WSNRoutingEnv(gym.Env):
         reward_dispersion_remaining_energy = self.compute_reward_dispersion_remaining_energy()
         reward_number_of_packets = self.compute_reward_number_of_packets(action)

-        rewards_energy =
+        rewards_energy = [reward_angle, reward_consumption_energy, reward_dispersion_remaining_energy, reward_number_of_packets]

         #-- rewards related to the performance metrics
         reward_latency = self.compute_reward_latency()
@@ -390,7 +390,7 @@ class WSNRoutingEnv(gym.Env):
         reward_network_throughput = self.compute_reward_network_throughput()
         reward_packet_delivery_ratio = self.compute_reward_packet_delivery_ratio()

-        rewards_performance =
+        rewards_performance = [reward_latency, reward_network_throughput, reward_packet_delivery_ratio]

         return rewards_energy

@@ -399,12 +399,12 @@ class WSNRoutingEnv(gym.Env):

         reward_consumption_energy = self.network_reward_consumption_energy()
         reward_dispersion_remaining_energy = self.network_reward_dispersion_remaining_energy()
-        rewards_energy =
+        rewards_energy = [reward_consumption_energy, reward_dispersion_remaining_energy]

         reward_latency = self.compute_reward_latency()
         reward_network_throughput = self.compute_reward_network_throughput()
         reward_packet_delivery_ratio = self.compute_reward_packet_delivery_ratio()
-        rewards_performance =
+        rewards_performance = [reward_latency, reward_network_throughput, reward_packet_delivery_ratio]

         return np.concatenate((rewards_energy, rewards_performance))

@@ -465,44 +465,45 @@ class WSNRoutingEnv(gym.Env):
         return np.clip(normalized_throughput, 0, 1)


-
-
-
-
-
-
-
+    def compute_attention_rewards(self, rewards):
+        '''
+        Compute the attention-based rewards
+        '''
+        rewards = torch.tensor(rewards, dtype=torch.double)
+        rewards = rewards.unsqueeze(0) # Add batch dimension
+        final_reward = net(rewards)
+        return final_reward


-    def compute_attention_reward(self, rewards):
-
-
+    # def compute_attention_reward(self, rewards):
+    #     '''
+    #     Compute the attention-based reward for the network with Q, V, and K matrices

-
-
-
-
-
-
-
+    #     Input:
+    #     - rewards: list of rewards for each sensor
+    #     Output:
+    #     - final_reward: final reward for the network
+    #     '''
+    #     # dimension of the sensor embedding
+    #     d = len(rewards[0])

-
-
+    #     # All sensors are represented by their raw rewards
+    #     query_vector = np.array([max_reward] * d) # Basically, the target is the base station

-
-
+    #     # Similarities between the query vector and the rewards
+    #     similarities = [np.dot(query_vector, reward) for reward in rewards]

-
-
+    #     # Similarities scaling
+    #     similarities = [similarity / np.sqrt(d) for similarity in similarities]

-
-
-
+    #     # Softmax operation
+    #     denominator = sum([np.exp(similarity) for similarity in similarities])
+    #     attention_weights = [np.exp(similarity) / denominator for similarity in similarities]

-
-
+    #     # Weighted sum of the rewards
+    #     final_reward = sum([attention_weight * reward for attention_weight, reward in zip(attention_weights, rewards)])

-
+    #     return final_reward


     def integrate_mobility(self):
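The new `compute_attention_rewards` calls a module-level `net` whose definition is not part of this diff. For orientation only, a scaled dot-product attention aggregator of the kind that call appears to expect could look like the sketch below; the class name, layer sizes, and pooling are assumptions, not the package's actual code:

```python
# Illustrative sketch only: the real `net` used by compute_attention_rewards is not shown in this diff.
import torch
import torch.nn as nn

class AttentionAggregator(nn.Module):  # hypothetical name and architecture
    def __init__(self, input_dim: int, hidden_dim: int = 64):
        super().__init__()
        # Q, K, V projections for scaled dot-product attention over the per-sensor reward vectors
        self.query = nn.Linear(input_dim, hidden_dim)
        self.key = nn.Linear(input_dim, hidden_dim)
        self.value = nn.Linear(input_dim, hidden_dim)
        self.out = nn.Linear(hidden_dim, 1)

    def forward(self, rewards: torch.Tensor) -> torch.Tensor:
        # rewards: (batch, n_sensors, input_dim), as produced by compute_attention_rewards
        q, k, v = self.query(rewards), self.key(rewards), self.value(rewards)
        scores = torch.softmax(q @ k.transpose(-2, -1) / k.shape[-1] ** 0.5, dim=-1)
        pooled = (scores @ v).mean(dim=1)       # aggregate attended values over sensors
        return self.out(pooled).squeeze(-1)     # one scalar reward per batch element

# .double() matches the torch.double tensor built in compute_attention_rewards; input_dim=4 is an assumption.
net = AttentionAggregator(input_dim=4).double()
```

Whatever the real definition is, it has to accept a double-precision tensor of shape `(1, n_sensors, input_dim)` and return the aggregate reward, since that is how the new method invokes it.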
gym_examples-3.0.750.dist-info/RECORD
@@ -0,0 +1,7 @@
+gym_examples/__init__.py,sha256=qaPZA7Q93uDypjo58Stoco6cD-o4R03zzeYSCAE2JhU,166
+gym_examples/envs/__init__.py,sha256=lgMe4pyOuUTgTBUddM0iwMlETsYTwFShny6ifm8PGM8,53
+gym_examples/envs/wsn_env.py,sha256=8ne-Dm4xfoY-AYDyzOiZ1RjDtG6RjuWrXiiFQSix8Ac,26639
+gym_examples-3.0.750.dist-info/METADATA,sha256=LdlfRyDsFXXtHKkA1m-f2Gmb0_wXxb2dQPwpYuVD0OM,412
+gym_examples-3.0.750.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
+gym_examples-3.0.750.dist-info/top_level.txt,sha256=rJRksoAF32M6lTLBEwYzRdo4PgtejceaNnnZ3HeY_Rk,13
+gym_examples-3.0.750.dist-info/RECORD,,
gym_examples-3.0.748.dist-info/RECORD
@@ -1,7 +0,0 @@
-gym_examples/__init__.py,sha256=eYYXxWIuq0ncCeOZlkOdiiSyvf-tuxzRHAPrh_PA3_c,166
-gym_examples/envs/__init__.py,sha256=lgMe4pyOuUTgTBUddM0iwMlETsYTwFShny6ifm8PGM8,53
-gym_examples/envs/wsn_env.py,sha256=MEp84-JlL4oPg0YTGl-PvVIOZdC4xi8cyBCfNkbtdDQ,26601
-gym_examples-3.0.748.dist-info/METADATA,sha256=j3_GmDZ2TiworAz03Jo9cnA5PrCbt1LlaBD5izqbJnU,412
-gym_examples-3.0.748.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
-gym_examples-3.0.748.dist-info/top_level.txt,sha256=rJRksoAF32M6lTLBEwYzRdo4PgtejceaNnnZ3HeY_Rk,13
-gym_examples-3.0.748.dist-info/RECORD,,
{gym_examples-3.0.748.dist-info → gym_examples-3.0.750.dist-info}/WHEEL
File without changes
{gym_examples-3.0.748.dist-info → gym_examples-3.0.750.dist-info}/top_level.txt
File without changes