PyPI - torchrl-nightly - Versions diffs - 2025.8.8__cp312-cp312-manylinux1_x86_64.whl → 2025.8.10__cp312-cp312-manylinux1_x86_64.whl - Mend

torchrl-nightly 2025.8.8__cp312-cp312-manylinux1_x86_64.whl → 2025.8.10__cp312-cp312-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85)

benchmarks/ecosystem/vmas_rllib_vs_torchrl_sampling_performance.py +1 -2
sota-implementations/grpo/grpo_utils.py +2 -1
sota-implementations/redq/utils.py +2 -1
torchrl/_torchrl.cpython-312-x86_64-linux-gnu.so +0 -0
torchrl/_utils.py +2 -1
torchrl/collectors/collectors.py +2 -1
torchrl/collectors/distributed/generic.py +3 -1
torchrl/collectors/distributed/ray.py +3 -1
torchrl/collectors/distributed/rpc.py +3 -1
torchrl/collectors/distributed/sync.py +3 -1
torchrl/collectors/llm/base.py +2 -1
torchrl/collectors/llm/ray_collector.py +2 -1
torchrl/collectors/utils.py +1 -1
torchrl/collectors/weight_update.py +2 -1
torchrl/data/datasets/atari_dqn.py +1 -1
torchrl/data/datasets/common.py +1 -1
torchrl/data/datasets/d4rl.py +1 -1
torchrl/data/datasets/minari_data.py +1 -1
torchrl/data/datasets/openml.py +1 -1
torchrl/data/datasets/openx.py +2 -1
torchrl/data/datasets/roboset.py +1 -1
torchrl/data/datasets/vd4rl.py +1 -1
torchrl/data/llm/dataset.py +1 -1
torchrl/data/map/hash.py +1 -1
torchrl/data/map/query.py +4 -2
torchrl/data/map/tdstorage.py +2 -1
torchrl/data/map/tree.py +2 -1
torchrl/data/map/utils.py +1 -1
torchrl/data/replay_buffers/ray_buffer.py +2 -1
torchrl/data/replay_buffers/replay_buffers.py +2 -1
torchrl/data/replay_buffers/scheduler.py +2 -1
torchrl/data/replay_buffers/storages.py +2 -1
torchrl/data/replay_buffers/utils.py +2 -1
torchrl/data/replay_buffers/writers.py +2 -1
torchrl/data/tensor_specs.py +8 -19
torchrl/data/utils.py +3 -2
torchrl/envs/async_envs.py +2 -1
torchrl/envs/batched_envs.py +2 -1
torchrl/envs/common.py +2 -1
torchrl/envs/custom/llm.py +1 -1
torchrl/envs/env_creator.py +1 -1
torchrl/envs/gym_like.py +2 -1
torchrl/envs/libs/dm_control.py +2 -2
torchrl/envs/libs/gym.py +2 -3
torchrl/envs/libs/meltingpot.py +1 -1
torchrl/envs/libs/pettingzoo.py +2 -3
torchrl/envs/libs/smacv2.py +8 -10
torchrl/envs/llm/chat.py +3 -1
torchrl/envs/llm/datasets/gsm8k.py +2 -1
torchrl/envs/llm/datasets/ifeval.py +3 -1
torchrl/envs/llm/envs.py +2 -1
torchrl/envs/llm/reward/ifeval/_instructions.py +3 -2
torchrl/envs/llm/reward/ifeval/_instructions_util.py +1 -1
torchrl/envs/llm/reward/ifeval/_scorer.py +1 -1
torchrl/envs/llm/transforms/dataloading.py +2 -2
torchrl/envs/llm/transforms/reason.py +2 -1
torchrl/envs/llm/transforms/tokenizer.py +1 -1
torchrl/envs/transforms/transforms.py +3 -10
torchrl/envs/transforms/vecnorm.py +3 -1
torchrl/modules/distributions/continuous.py +1 -1
torchrl/modules/distributions/discrete.py +2 -1
torchrl/modules/models/exploration.py +1 -1
torchrl/modules/models/models.py +1 -1
torchrl/modules/models/multiagent.py +1 -1
torchrl/modules/models/utils.py +1 -1
torchrl/modules/tensordict_module/actors.py +1 -1
torchrl/modules/tensordict_module/common.py +1 -1
torchrl/objectives/common.py +1 -1
torchrl/objectives/ppo.py +1 -1
torchrl/objectives/utils.py +2 -1
torchrl/objectives/value/advantages.py +1 -1
torchrl/record/loggers/common.py +1 -1
torchrl/record/loggers/csv.py +1 -1
torchrl/record/loggers/mlflow.py +2 -1
torchrl/record/loggers/tensorboard.py +1 -1
torchrl/record/loggers/wandb.py +1 -1
torchrl/record/recorder.py +1 -1
torchrl/trainers/helpers/collectors.py +3 -1
torchrl/trainers/helpers/envs.py +14 -13
torchrl/trainers/trainers.py +5 -4
{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/METADATA +1 -1
{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/RECORD +85 -85
{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/WHEEL +0 -0
{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/licenses/LICENSE +0 -0
{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/top_level.txt +0 -0

torchrl/envs/libs/smacv2.py CHANGED Viewed

@@ -5,8 +5,6 @@
 import importlib
 import re
-from typing import Dict, Optional
 import torch
 from tensordict import TensorDict, TensorDictBase
@@ -196,7 +194,7 @@ class SMACv2Wrapper(_EnvWrapper):
         return smacv2
-    def _check_kwargs(self, kwargs: Dict):
+    def _check_kwargs(self, kwargs: dict):
         import smacv2
         if "env" not in kwargs:
@@ -311,7 +309,7 @@ class SMACv2Wrapper(_EnvWrapper):
         )
         return spec
-    def _set_seed(self, seed: Optional[int]) -> None:
+    def _set_seed(self, seed: int | None) -> None:
         if seed is not None:
             raise NotImplementedError(
                 "Seed cannot be changed once environment was created."
@@ -329,7 +327,7 @@ class SMACv2Wrapper(_EnvWrapper):
         return torch.tensor(value, device=self.device, dtype=torch.float32)
     def _reset(
-        self, tensordict: Optional[TensorDictBase] = None, **kwargs
+        self, tensordict: TensorDictBase | None = None, **kwargs
     ) -> TensorDictBase:
         obs, state = self._env.reset()
@@ -602,8 +600,8 @@ class SMACv2Env(SMACv2Wrapper):
     def __init__(
         self,
         map_name: str,
-        capability_config: Optional[Dict] = None,
-        seed: Optional[int] = None,
+        capability_config: dict | None = None,
+        seed: int | None = None,
         categorical_actions: bool = True,
         **kwargs,
     ):
@@ -619,15 +617,15 @@ class SMACv2Env(SMACv2Wrapper):
         super().__init__(**kwargs)
-    def _check_kwargs(self, kwargs: Dict):
+    def _check_kwargs(self, kwargs: dict):
         if "map_name" not in kwargs:
             raise TypeError("Expected 'map_name' to be part of kwargs")
     def _build_env(
         self,
         map_name: str,
-        capability_config: Optional[Dict] = None,
-        seed: Optional[int] = None,
+        capability_config: dict | None = None,
+        seed: int | None = None,
         **kwargs,
     ) -> "smacv2.env.StarCraft2Env":  # noqa: F821
         import smacv2.env

torchrl/envs/llm/chat.py CHANGED Viewed

@@ -4,7 +4,9 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
-from typing import Any, Callable, Literal, TYPE_CHECKING
+from collections.abc import Callable
+from typing import Any, Literal, TYPE_CHECKING
 import torch
 from tensordict import lazy_stack, TensorDictBase

torchrl/envs/llm/datasets/gsm8k.py CHANGED Viewed

@@ -5,7 +5,8 @@
 from __future__ import annotations
 import warnings
-from typing import Any, Callable, Literal, TYPE_CHECKING
+from collections.abc import Callable
+from typing import Any, Literal, TYPE_CHECKING
 import torch
 from tensordict import NestedKey, TensorDict, TensorDictBase

torchrl/envs/llm/datasets/ifeval.py CHANGED Viewed

@@ -4,7 +4,9 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
-from typing import Any, Callable, Literal, TYPE_CHECKING
+from collections.abc import Callable
+from typing import Any, Literal, TYPE_CHECKING
 import torch
 from tensordict import NonTensorData, NonTensorStack, TensorClass, TensorDict

torchrl/envs/llm/envs.py CHANGED Viewed

@@ -5,8 +5,9 @@
 from __future__ import annotations
 import warnings
+from collections.abc import Callable
-from typing import Any, Callable, Literal, TYPE_CHECKING
+from typing import Any, Literal, TYPE_CHECKING
 import torch

torchrl/envs/llm/reward/ifeval/_instructions.py CHANGED Viewed

@@ -36,7 +36,8 @@ import json
 import random
 import re
 import string
-from typing import Any, Dict, Literal, Optional, Sequence, Union
+from collections.abc import Sequence
+from typing import Any, Literal, Optional, Union
 from torchrl._utils import logger as torchrl_logger
@@ -50,7 +51,7 @@ from ._instructions_util import (
 )
-_InstructionArgsDtype = Optional[Dict[str, Union[int, str, Sequence[str]]]]
+_InstructionArgsDtype = Optional[dict[str, Union[int, str, Sequence[str]]]]
 _LANGUAGES = LANGUAGE_CODES

torchrl/envs/llm/reward/ifeval/_instructions_util.py CHANGED Viewed

@@ -1660,7 +1660,7 @@ def count_words(text):
     return num_words
-@functools.lru_cache(maxsize=None)
+@functools.cache
 def _get_sentence_tokenizer():
     return nltk.data.load("nltk:tokenizers/punkt/english.pickle")

torchrl/envs/llm/reward/ifeval/_scorer.py CHANGED Viewed

@@ -17,7 +17,7 @@ from __future__ import annotations
 import importlib.util
 import re
-from typing import Callable
+from collections.abc import Callable
 import torch
 from tensordict import (

torchrl/envs/llm/transforms/dataloading.py CHANGED Viewed

@@ -6,8 +6,8 @@ from __future__ import annotations
 import warnings
 from collections import deque
-from collections.abc import Mapping
-from typing import Any, Callable, Iterable, Literal
+from collections.abc import Callable, Iterable, Mapping
+from typing import Any, Literal
 import torch
 from tensordict import is_tensor_collection, lazy_stack, TensorDict, TensorDictBase

torchrl/envs/llm/transforms/reason.py CHANGED Viewed

@@ -6,7 +6,8 @@
 from __future__ import annotations
 import re
-from typing import Callable, Literal
+from collections.abc import Callable
+from typing import Literal
 from tensordict import lazy_stack, TensorDictBase
 from torchrl._utils import logger as torchrl_logger

torchrl/envs/llm/transforms/tokenizer.py CHANGED Viewed

@@ -5,7 +5,7 @@
 from __future__ import annotations
-from typing import Sequence
+from collections.abc import Sequence
 import torch
 from tensordict import NonTensorData, NonTensorStack, TensorDictBase

torchrl/envs/transforms/transforms.py CHANGED Viewed

@@ -14,20 +14,13 @@ import multiprocessing as mp
 import time
 import warnings
 import weakref
+from collections import OrderedDict
+from collections.abc import Callable, Mapping, Sequence
 from copy import copy
 from enum import IntEnum
 from functools import wraps
 from textwrap import indent
-from typing import (
-    Any,
-    Callable,
-    Mapping,
-    OrderedDict,
-    Sequence,
-    TYPE_CHECKING,
-    TypeVar,
-    Union,
-)
+from typing import Any, TYPE_CHECKING, TypeVar, Union
 import numpy as np

torchrl/envs/transforms/vecnorm.py CHANGED Viewed

@@ -7,9 +7,11 @@ from __future__ import annotations
 import math
 import uuid
 import warnings
+from collections import OrderedDict
+from collections.abc import Sequence
 from copy import copy
-from typing import Any, OrderedDict, Sequence
+from typing import Any
 import torch
 from tensordict import NestedKey, TensorDict, TensorDictBase, unravel_key

torchrl/modules/distributions/continuous.py CHANGED Viewed

@@ -5,8 +5,8 @@
 from __future__ import annotations
 import weakref
+from collections.abc import Sequence
 from numbers import Number
-from typing import Sequence
 import numpy as np
 import torch

torchrl/modules/distributions/discrete.py CHANGED Viewed

@@ -4,9 +4,10 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
+from collections.abc import Sequence
 from enum import Enum
 from functools import wraps
-from typing import Sequence
 import torch
 import torch.distributions as D

torchrl/modules/models/exploration.py CHANGED Viewed

@@ -7,7 +7,7 @@ from __future__ import annotations
 import functools
 import math
 import warnings
-from typing import Sequence
+from collections.abc import Sequence
 import torch
 from tensordict.nn import TensorDictModuleBase

torchrl/modules/models/models.py CHANGED Viewed

@@ -5,9 +5,9 @@
 from __future__ import annotations
 import dataclasses
+from collections.abc import Callable, Sequence
 from copy import deepcopy
 from numbers import Number
-from typing import Callable, Sequence
 import torch
 from torch import nn

torchrl/modules/models/multiagent.py CHANGED Viewed

@@ -5,9 +5,9 @@
 from __future__ import annotations
 import abc
+from collections.abc import Sequence
 from copy import deepcopy
 from textwrap import indent
-from typing import Sequence
 import numpy as np
 import torch

torchrl/modules/models/utils.py CHANGED Viewed

@@ -6,7 +6,7 @@ from __future__ import annotations
 import inspect
 import warnings
-from typing import Callable, Sequence
+from collections.abc import Callable, Sequence
 import torch
 from torch import nn

torchrl/modules/tensordict_module/actors.py CHANGED Viewed

@@ -4,7 +4,7 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
-from typing import Sequence
+from collections.abc import Sequence
 import torch
 from tensordict import TensorDictBase, unravel_key

torchrl/modules/tensordict_module/common.py CHANGED Viewed

@@ -9,7 +9,7 @@ import importlib.util
 import inspect
 import re
 import warnings
-from typing import Iterable
+from collections.abc import Iterable
 import torch
 from tensordict import TensorDictBase, unravel_key_list

torchrl/objectives/common.py CHANGED Viewed

@@ -8,9 +8,9 @@ from __future__ import annotations
 import abc
 import functools
 import warnings
+from collections.abc import Iterator
 from copy import deepcopy
 from dataclasses import dataclass
-from typing import Iterator
 import torch
 from tensordict import is_tensor_collection, TensorDict, TensorDictBase

torchrl/objectives/ppo.py CHANGED Viewed

@@ -6,9 +6,9 @@ from __future__ import annotations
 import contextlib
 import warnings
+from collections.abc import Mapping
 from copy import deepcopy
 from dataclasses import dataclass
-from typing import Mapping
 import torch
 from tensordict import (

torchrl/objectives/utils.py CHANGED Viewed

@@ -7,9 +7,10 @@ from __future__ import annotations
 import functools
 import re
 import warnings
+from collections.abc import Callable, Iterable
 from copy import copy
 from enum import Enum
-from typing import Any, Callable, Iterable, TypeVar
+from typing import Any, TypeVar
 import torch
 from tensordict import NestedKey, TensorDict, TensorDictBase, unravel_key

torchrl/objectives/value/advantages.py CHANGED Viewed

@@ -7,10 +7,10 @@ from __future__ import annotations
 import abc
 import functools
 import warnings
+from collections.abc import Callable
 from contextlib import nullcontext
 from dataclasses import asdict, dataclass
 from functools import wraps
-from typing import Callable
 import torch
 from tensordict import is_tensor_collection, TensorDictBase

torchrl/record/loggers/common.py CHANGED Viewed

@@ -5,7 +5,7 @@
 from __future__ import annotations
 import abc
-from typing import Sequence
+from collections.abc import Sequence
 from torch import Tensor

torchrl/record/loggers/csv.py CHANGED Viewed

@@ -6,8 +6,8 @@ from __future__ import annotations
 import os
 from collections import defaultdict
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Sequence
 import tensordict.utils
 import torch

torchrl/record/loggers/mlflow.py CHANGED Viewed

@@ -7,8 +7,9 @@ from __future__ import annotations
 import importlib.util
 import os
+from collections.abc import Sequence
 from tempfile import TemporaryDirectory
-from typing import Any, Sequence
+from typing import Any
 from torch import Tensor

torchrl/record/loggers/tensorboard.py CHANGED Viewed

@@ -7,7 +7,7 @@ from __future__ import annotations
 import importlib.util
 import os
-from typing import Sequence
+from collections.abc import Sequence
 from torch import Tensor

torchrl/record/loggers/wandb.py CHANGED Viewed

@@ -7,7 +7,7 @@ from __future__ import annotations
 import importlib.util
 import os
-from typing import Sequence
+from collections.abc import Sequence
 from torch import Tensor

torchrl/record/recorder.py CHANGED Viewed

@@ -6,8 +6,8 @@ from __future__ import annotations
 import importlib.util
 import math
+from collections.abc import Callable, Sequence
 from copy import copy
-from typing import Callable, Sequence
 import numpy as np
 import torch

torchrl/trainers/helpers/collectors.py CHANGED Viewed

@@ -4,8 +4,10 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
+from collections.abc import Callable
 from dataclasses import dataclass, field
-from typing import Any, Callable
+from typing import Any
 from tensordict import TensorDictBase

torchrl/trainers/helpers/envs.py CHANGED Viewed

@@ -8,9 +8,10 @@
 # from __future__ import annotations
 import importlib.util
+from collections.abc import Callable, Sequence
 from copy import copy
 from dataclasses import dataclass, field as dataclass_field
-from typing import Any, Callable, Optional, Sequence, Union
+from typing import Any
 import torch
 from torchrl._utils import logger as torchrl_logger, VERBOSE
@@ -223,18 +224,18 @@ def get_norm_state_dict(env):
 def transformed_env_constructor(
     cfg: DictConfig,  # noqa: F821
     video_tag: str = "",
-    logger: Optional[Logger] = None,  # noqa
-    stats: Optional[dict] = None,
+    logger: Logger | None = None,  # noqa
+    stats: dict | None = None,
     norm_obs_only: bool = False,
     use_env_creator: bool = False,
-    custom_env_maker: Optional[Callable] = None,
-    custom_env: Optional[EnvBase] = None,
+    custom_env_maker: Callable | None = None,
+    custom_env: EnvBase | None = None,
     return_transformed_envs: bool = True,
-    action_dim_gsde: Optional[int] = None,
-    state_dim_gsde: Optional[int] = None,
-    batch_dims: Optional[int] = 0,
-    obs_norm_state_dict: Optional[dict] = None,
-) -> Union[Callable, EnvCreator]:
+    action_dim_gsde: int | None = None,
+    state_dim_gsde: int | None = None,
+    batch_dims: int | None = 0,
+    obs_norm_state_dict: dict | None = None,
+) -> Callable | EnvCreator:
     """Returns an environment creator from an argparse.Namespace built with the appropriate parser constructor.
     Args:
@@ -340,7 +341,7 @@ def transformed_env_constructor(
 def parallel_env_constructor(
     cfg: DictConfig, **kwargs  # noqa: F821
-) -> Union[ParallelEnv, EnvCreator]:
+) -> ParallelEnv | EnvCreator:
     """Returns a parallel environment from an argparse.Namespace built with the appropriate parser constructor.
     Args:
@@ -385,7 +386,7 @@ def parallel_env_constructor(
 def get_stats_random_rollout(
     cfg: DictConfig,  # noqa: F821
     proof_environment: EnvBase = None,
-    key: Optional[str] = None,
+    key: str | None = None,
 ):
     """Gathers stas (loc and scale) from an environment using random rollouts.
@@ -463,7 +464,7 @@ def get_stats_random_rollout(
 def initialize_observation_norm_transforms(
     proof_environment: EnvBase,
     num_iter: int = 1000,
-    key: Union[str, tuple[str, ...]] = None,
+    key: str | tuple[str, ...] = None,
 ):
     """Calls :obj:`ObservationNorm.init_stats` on all uninitialized :obj:`ObservationNorm` instances of a :obj:`TransformedEnv`.

torchrl/trainers/trainers.py CHANGED Viewed

@@ -9,9 +9,10 @@ import abc
 import pathlib
 import warnings
 from collections import defaultdict, OrderedDict
+from collections.abc import Callable, Sequence
 from copy import deepcopy
 from textwrap import indent
-from typing import Any, Callable, Sequence, Tuple
+from typing import Any
 import numpy as np
 import torch.nn
@@ -362,19 +363,19 @@ class Trainer:
         elif dest == "pre_steps_log":
             _check_input_output_typehint(
-                op, input=TensorDictBase, output=Tuple[str, float]
+                op, input=TensorDictBase, output=tuple[str, float]
             )
             self._pre_steps_log_ops.append((op, kwargs))
         elif dest == "post_steps_log":
             _check_input_output_typehint(
-                op, input=TensorDictBase, output=Tuple[str, float]
+                op, input=TensorDictBase, output=tuple[str, float]
             )
             self._post_steps_log_ops.append((op, kwargs))
         elif dest == "post_optim_log":
             _check_input_output_typehint(
-                op, input=TensorDictBase, output=Tuple[str, float]
+                op, input=TensorDictBase, output=tuple[str, float]
             )
             self._post_optim_log_ops.append((op, kwargs))

{torchrl_nightly-2025.8.8.dist-info → torchrl_nightly-2025.8.10.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: torchrl-nightly
-Version: 2025.8.8
+Version: 2025.8.10
 Summary: A modular, primitive-first, python-first PyTorch library for Reinforcement Learning
 Author-email: torchrl contributors <vmoens@fb.com>
 Maintainer-email: torchrl contributors <vmoens@fb.com>