metacontroller-pytorch 0.0.15__py3-none-any.whl → 0.0.16__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- metacontroller/metacontroller.py +8 -1
- {metacontroller_pytorch-0.0.15.dist-info → metacontroller_pytorch-0.0.16.dist-info}/METADATA +2 -2
- metacontroller_pytorch-0.0.16.dist-info/RECORD +6 -0
- metacontroller_pytorch-0.0.15.dist-info/RECORD +0 -6
- {metacontroller_pytorch-0.0.15.dist-info → metacontroller_pytorch-0.0.16.dist-info}/WHEEL +0 -0
- {metacontroller_pytorch-0.0.15.dist-info → metacontroller_pytorch-0.0.16.dist-info}/licenses/LICENSE +0 -0
metacontroller/metacontroller.py
CHANGED
|
@@ -308,7 +308,8 @@ class Transformer(Module):
|
|
|
308
308
|
|
|
309
309
|
# handle maybe behavioral cloning
|
|
310
310
|
|
|
311
|
-
if behavioral_cloning:
|
|
311
|
+
if behavioral_cloning or (meta_controlling and discovery_phase):
|
|
312
|
+
|
|
312
313
|
state, target_state = state[:, :-1], state[:, 1:]
|
|
313
314
|
action_ids, target_action_ids = action_ids[:, :-1], action_ids[:, 1:]
|
|
314
315
|
|
|
@@ -352,6 +353,12 @@ class Transformer(Module):
|
|
|
352
353
|
|
|
353
354
|
return state_clone_loss, action_clone_loss
|
|
354
355
|
|
|
356
|
+
elif meta_controlling and discovery_phase:
|
|
357
|
+
|
|
358
|
+
action_recon_loss = self.action_readout.calculate_loss(dist_params, target_action_ids)
|
|
359
|
+
|
|
360
|
+
return action_recon_loss, next_meta_hiddens.kl_loss
|
|
361
|
+
|
|
355
362
|
# returning
|
|
356
363
|
|
|
357
364
|
return_one = not (return_latents or return_cache)
|
{metacontroller_pytorch-0.0.15.dist-info → metacontroller_pytorch-0.0.16.dist-info}/METADATA
RENAMED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: metacontroller-pytorch
|
|
3
|
-
Version: 0.0.15
|
|
3
|
+
Version: 0.0.16
|
|
4
4
|
Summary: Transformer Metacontroller
|
|
5
5
|
Project-URL: Homepage, https://pypi.org/project/metacontroller/
|
|
6
6
|
Project-URL: Repository, https://github.com/lucidrains/metacontroller
|
|
@@ -60,7 +60,7 @@ Implementation of the MetaController proposed in [Emergent temporal abstractions
|
|
|
60
60
|
@misc{kobayashi2025emergenttemporalabstractionsautoregressive,
|
|
61
61
|
title = {Emergent temporal abstractions in autoregressive models enable hierarchical reinforcement learning},
|
|
62
62
|
author = {Seijin Kobayashi and Yanick Schimpf and Maximilian Schlegel and Angelika Steger and Maciej Wolczyk and Johannes von Oswald and Nino Scherrer and Kaitlin Maile and Guillaume Lajoie and Blake A. Richards and Rif A. Saurous and James Manyika and Blaise Agüera y Arcas and Alexander Meulemans and João Sacramento},
|
|
63
|
-
year={2025},
|
|
63
|
+
year = {2025},
|
|
64
64
|
eprint = {2512.20605},
|
|
65
65
|
archivePrefix = {arXiv},
|
|
66
66
|
primaryClass = {cs.LG},
|
|
@@ -0,0 +1,6 @@
|
|
|
1
|
+
metacontroller/__init__.py,sha256=lj7IOGpN--qMxJWbB-4SGqoPXG7Hd4mgtToTRSyTZ58,57
|
|
2
|
+
metacontroller/metacontroller.py,sha256=BT7GH8F9NkEIYLEueBkkZ8glQ3Oht1FRoV84SIaTWdQ,11878
|
|
3
|
+
metacontroller_pytorch-0.0.16.dist-info/METADATA,sha256=eyECb3994X58zyExLnnffMl3pOoMlIb-WAUhepIt0r8,3741
|
|
4
|
+
metacontroller_pytorch-0.0.16.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
5
|
+
metacontroller_pytorch-0.0.16.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
|
6
|
+
metacontroller_pytorch-0.0.16.dist-info/RECORD,,
|
|
@@ -1,6 +0,0 @@
|
|
|
1
|
-
metacontroller/__init__.py,sha256=lj7IOGpN--qMxJWbB-4SGqoPXG7Hd4mgtToTRSyTZ58,57
|
|
2
|
-
metacontroller/metacontroller.py,sha256=ug3xeMTZKApTF8oOPx9hWypeDjRflf1IJp8RiysXgTo,11618
|
|
3
|
-
metacontroller_pytorch-0.0.15.dist-info/METADATA,sha256=9d39BpcuVeOVVSD66lCVHCK1GjrkeKzRtxKOPOc-7xQ,3736
|
|
4
|
-
metacontroller_pytorch-0.0.15.dist-info/WHEEL,sha256=WLgqFyCfm_KASv4WHyYy0P3pM_m7J5L9k2skdKLirC8,87
|
|
5
|
-
metacontroller_pytorch-0.0.15.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
|
|
6
|
-
metacontroller_pytorch-0.0.15.dist-info/RECORD,,
|
|
File without changes
|
{metacontroller_pytorch-0.0.15.dist-info → metacontroller_pytorch-0.0.16.dist-info}/licenses/LICENSE
RENAMED
|
File without changes
|