dreamer4 0.0.97__tar.gz → 0.0.99__tar.gz

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: dreamer4
3
- Version: 0.0.97
3
+ Version: 0.0.99
4
4
  Summary: Dreamer 4
5
5
  Project-URL: Homepage, https://pypi.org/project/dreamer4/
6
6
  Project-URL: Repository, https://github.com/lucidrains/dreamer4
@@ -2580,6 +2580,8 @@ class DynamicsWorldModel(Module):
2580
2580
  if self.pmpo_kl_div_loss_weight > 0.:
2581
2581
  new_unembedded_actions = self.action_embedder.unembed(policy_embed, pred_head_index = 0)
2582
2582
 
2583
+ # mentioned that the "reverse direction for the prior KL" was used
2584
+
2583
2585
  discrete_kl_div, continuous_kl_div = self.action_embedder.kl_div(old_action_unembeds, new_unembedded_actions)
2584
2586
 
2585
2587
  # accumulate discrete and continuous kl div
@@ -2868,7 +2870,7 @@ class DynamicsWorldModel(Module):
2868
2870
  # maybe store old actions
2869
2871
 
2870
2872
  if store_old_action_unembeds:
2871
- acc_policy_embed = safe_cat((acc_policy_embed, policy_embed))
2873
+ acc_policy_embed = safe_cat((acc_policy_embed, policy_embed), dim = 1)
2872
2874
 
2873
2875
  # sample actions
2874
2876
 
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "dreamer4"
3
- version = "0.0.97"
3
+ version = "0.0.99"
4
4
  description = "Dreamer 4"
5
5
  authors = [
6
6
  { name = "Phil Wang", email = "lucidrains@gmail.com" }
File without changes
File without changes
File without changes
File without changes
File without changes