Skip to content

Commit e43b3fe

Browse files
author
Vincent Moens
committed
Update
[ghstack-poisoned]
1 parent c1e6896 commit e43b3fe

File tree

8 files changed

+229
-40
lines changed

8 files changed

+229
-40
lines changed

tensordict/_lazy.py

Lines changed: 143 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,7 @@
3434
import torch
3535

3636
from tensordict.memmap import MemoryMappedTensor
37+
from torch.nn.utils.rnn import pad_sequence
3738

3839
try:
3940
from functorch import dim as ftdim
@@ -516,7 +517,7 @@ def get_item_shape(self, key):
516517
return item.shape
517518
except RuntimeError as err:
518519
if re.match(
519-
r"Found more than one unique shape in the tensors|Could not run 'aten::stack' with arguments from the",
520+
r"Failed to stack tensors within a tensordict",
520521
str(err),
521522
):
522523
shape = None
@@ -1057,11 +1058,87 @@ def _maybe_get_list(self, key):
10571058
vals.append(val)
10581059
return vals
10591060

1061+
def get(
1062+
self,
1063+
key: NestedKey,
1064+
*args,
1065+
as_list: bool = False,
1066+
as_padded_tensor: bool = False,
1067+
as_nested_tensor: bool = False,
1068+
padding_side: str = "right",
1069+
layout: torch.layout = None,
1070+
padding_value: float | int | bool = 0.0,
1071+
**kwargs,
1072+
) -> CompatibleType:
1073+
"""Gets the value stored with the input key.
1074+
1075+
Args:
1076+
key (str, tuple of str): key to be queried. If tuple of str it is
1077+
equivalent to chained calls of getattr.
1078+
default: default value if the key is not found in the tensordict. Defaults to ``None``.
1079+
1080+
.. warning::
1081+
Previously, if a key was not present in the tensordict and no default
1082+
was passed, a `KeyError` was raised. From v0.7, this behaviour has been changed
1083+
and a `None` value is returned instead (in accordance with the behavior of ``dict.get``).
1084+
To adopt the old behavior, set the environment variable `export TD_GET_DEFAULTS_TO_NONE='0'` or call
1085+
:func:`~tensordict.set_get_defaults_to_none(False)`.
1086+
1087+
Keyword Args:
1088+
as_list (bool, optional): if ``True``, ragged tensors will be returned as list.
1089+
Exclusive with `as_padded_tensor` and `as_nested_tensor`.
1090+
Defaults to ``False``.
1091+
as_padded_tensor (bool, optional): if ``True``, ragged tensors will be returned as padded tensors.
1092+
The padding value can be controlled via the `padding_value` keyword argument, and the padding
1093+
side via the `padding_side` argument.
1094+
Exclusive with `as_list` and `as_nested_tensor`.
1095+
Defaults to ``False``.
1096+
as_nested_tensor (bool, optional): if ``True``, ragged tensors will be returned as nested tensors.
1097+
Exclusive with `as_list` and `as_padded_tensor`.
1098+
The layout can be controlled via the `layout` keyword argument.
1099+
Defaults to ``False``.
1100+
layout (torch.layout, optional): the layout when `as_nested_tensor=True`.
1101+
padding_side (str): The side of padding. Must be `"left"` or `"right"`. Defaults to `"right"`.
1102+
padding_value (scalar or bool, optional): The padding value. Defaults to 0.0.
1103+
1104+
Examples:
1105+
>>> from tensordict import TensorDict, lazy_stack
1106+
>>> import torch
1107+
>>> td = lazy_stack([
1108+
... TensorDict({"x": torch.ones(1,)}),
1109+
... TensorDict({"x": torch.ones(2,) * 2}),
1110+
... ])
1111+
>>> td.get("x", as_nested_tensor=True)
1112+
NestedTensor(size=(2, j1), offsets=tensor([0, 1, 3]), contiguous=True)
1113+
>>> td.get("x", as_padded_tensor=True)
1114+
tensor([[1., 0.],
1115+
[2., 2.]])
1116+
1117+
"""
1118+
return super().get(
1119+
key,
1120+
*args,
1121+
as_list=as_list,
1122+
as_padded_tensor=as_padded_tensor,
1123+
as_nested_tensor=as_nested_tensor,
1124+
padding_side=padding_side,
1125+
layout=layout,
1126+
padding_value=padding_value,
1127+
**kwargs,
1128+
)
1129+
10601130
@cache # noqa: B019
10611131
def _get_str(
10621132
self,
10631133
key: NestedKey,
10641134
default: Any = NO_DEFAULT,
1135+
*,
1136+
as_list: bool = False,
1137+
as_padded_tensor: bool = False,
1138+
as_nested_tensor: bool = False,
1139+
padding_side: str = "right",
1140+
layout: torch.layout = None,
1141+
padding_value: float | int | bool = 0.0,
10651142
) -> CompatibleType:
10661143
# we can handle the case where the key is a tuple of length 1
10671144
tensors = []
@@ -1076,7 +1153,15 @@ def _get_str(
10761153
return default
10771154
try:
10781155
out = self.lazy_stack(
1079-
tensors, self.stack_dim, stack_dim_name=self._td_dim_name
1156+
tensors,
1157+
self.stack_dim,
1158+
stack_dim_name=self._td_dim_name,
1159+
as_list=as_list,
1160+
as_padded_tensor=as_padded_tensor,
1161+
as_nested_tensor=as_nested_tensor,
1162+
padding_side=padding_side,
1163+
layout=layout,
1164+
padding_value=padding_value,
10801165
)
10811166
if _is_tensor_collection(type(out)):
10821167
if isinstance(out, LazyStackedTensorDict):
@@ -1118,8 +1203,8 @@ def _get_str(
11181203
else:
11191204
raise err
11201205

1121-
def _get_tuple(self, key, default):
1122-
first = self._get_str(key[0], None)
1206+
def _get_tuple(self, key, default, **kwargs):
1207+
first = self._get_str(key[0], None, **kwargs)
11231208
if first is None:
11241209
return self._default_get(key[0], default)
11251210
if len(key) == 1:
@@ -1130,7 +1215,7 @@ def _get_tuple(self, key, default):
11301215
raise ValueError(f"Got too many keys for a KJT: {key}.")
11311216
return first[key[-1]]
11321217
else:
1133-
return first._get_tuple(key[1:], default=default)
1218+
return first._get_tuple(key[1:], default=default, **kwargs)
11341219
except AttributeError as err:
11351220
if "has no attribute" in str(err):
11361221
raise ValueError(
@@ -1148,6 +1233,12 @@ def lazy_stack(
11481233
out: T | None = None,
11491234
stack_dim_name: str | None = None,
11501235
strict_shape: bool = False,
1236+
as_list: bool = False,
1237+
as_padded_tensor: bool = False,
1238+
as_nested_tensor: bool = False,
1239+
padding_side: str = "right",
1240+
layout: torch.layout | None = None,
1241+
padding_value: float | int | bool = 0.0,
11511242
) -> T: # noqa: D417
11521243
"""Stacks tensordicts in a LazyStackedTensorDict.
11531244
@@ -1164,13 +1255,55 @@ def lazy_stack(
11641255
stack_dim_name (str, optional): a name for the stacked dimension.
11651256
strict_shape (bool, optional): if ``True``, every tensordict's shapes must match.
11661257
Defaults to ``False``.
1258+
as_list (bool, optional): if ``True``, ragged tensors will be returned as list.
1259+
Exclusive with `as_padded_tensor` and `as_nested_tensor`.
1260+
Defaults to ``False``.
1261+
as_padded_tensor (bool, optional): if ``True``, ragged tensors will be returned as padded tensors.
1262+
The padding value can be controlled via the `padding_value` keyword argument, and the padding
1263+
side via the `padding_side` argument.
1264+
Exclusive with `as_list` and `as_nested_tensor`.
1265+
Defaults to ``False``.
1266+
as_nested_tensor (bool, optional): if ``True``, ragged tensors will be returned as nested tensors.
1267+
Exclusive with `as_list` and `as_padded_tensor`.
1268+
The layout can be controlled via the `layout` keyword argument.
1269+
Defaults to ``False``.
1270+
layout (torch.layout, optional): the layout when `as_nested_tensor=True`.
1271+
padding_side (str): The side of padding. Must be `"left"` or `"right"`. Defaults to `"right"`.
1272+
padding_value (scalar or bool, optional): The padding value. Defaults to 0.0.
11671273
11681274
"""
11691275
if not items:
11701276
raise RuntimeError("items cannot be empty")
11711277

11721278
if all(isinstance(item, torch.Tensor) for item in items):
1173-
return torch.stack(items, dim=dim, out=out)
1279+
# This must be implemented here and not in _get_str because we want to leverage this check
1280+
special_return = sum((as_list, as_padded_tensor, as_nested_tensor))
1281+
if special_return > 1:
1282+
raise TypeError(
1283+
"as_list, as_padded_tensor and as_nested_tensor are exclusive."
1284+
)
1285+
elif special_return:
1286+
if as_padded_tensor:
1287+
return pad_sequence(
1288+
items,
1289+
padding_value=padding_value,
1290+
padding_side=padding_side,
1291+
batch_first=True,
1292+
)
1293+
if as_nested_tensor:
1294+
if layout is None:
1295+
layout = torch.jagged
1296+
return torch.nested.as_nested_tensor(items, layout=layout)
1297+
if as_list:
1298+
return items
1299+
try:
1300+
return torch.stack(items, dim=dim, out=out)
1301+
except RuntimeError as err:
1302+
raise RuntimeError(
1303+
"Failed to stack tensors within a tensordict. You can use nested tensors, "
1304+
"padded tensors or return lists via specialized keyword arguments. "
1305+
"Check the TensorDict.lazy_stack documentation!"
1306+
) from err
11741307
if all(is_non_tensor(tensordict) for tensordict in items):
11751308
# Non-tensor data (Data or Stack) are stacked using NonTensorStack
11761309
# If the content is identical (not equal but same id) this does not
@@ -3521,14 +3654,14 @@ def _rename_subtds(self, names):
35213654
def _change_batch_size(self, new_size: torch.Size) -> None:
35223655
self._batch_size = new_size
35233656

3524-
def _get_str(self, key, default):
3525-
tensor = self._source._get_str(key, default)
3657+
def _get_str(self, key, default, **kwargs):
3658+
tensor = self._source._get_str(key, default, **kwargs)
35263659
if tensor is default:
35273660
return tensor
35283661
return self._transform_value(tensor)
35293662

3530-
def _get_tuple(self, key, default):
3531-
tensor = self._source._get_tuple(key, default)
3663+
def _get_tuple(self, key, default, **kwargs):
3664+
tensor = self._source._get_tuple(key, default, **kwargs)
35323665
if tensor is default:
35333666
return tensor
35343667
return self._transform_value(tensor)

tensordict/_td.py

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -2695,19 +2695,19 @@ def _stack_onto_at_(
26952695
# )
26962696
return self
26972697

2698-
def _get_str(self, key, default):
2698+
def _get_str(self, key, default, **kwargs):
26992699
first_key = key
27002700
out = self._tensordict.get(first_key)
27012701
if out is None:
27022702
return self._default_get(first_key, default)
27032703
return out
27042704

2705-
def _get_tuple(self, key, default):
2706-
first = self._get_str(key[0], default)
2705+
def _get_tuple(self, key, default, **kwargs):
2706+
first = self._get_str(key[0], default, **kwargs)
27072707
if len(key) == 1 or first is default:
27082708
return first
27092709
try:
2710-
return first._get_tuple(key[1:], default=default)
2710+
return first._get_tuple(key[1:], default=default, **kwargs)
27112711
except AttributeError as err:
27122712
if "has no attribute" in str(err):
27132713
raise ValueError(
@@ -3823,16 +3823,16 @@ def _get_non_tensor(self, key: NestedKey, default=NO_DEFAULT):
38233823
return out._source
38243824
return out
38253825

3826-
def _get_str(self, key, default):
3826+
def _get_str(self, key, default, **kwargs):
38273827
if key in self.keys() and _is_tensor_collection(self.entry_class(key)):
3828-
data = self._source._get_str(key, NO_DEFAULT)
3828+
data = self._source._get_str(key, NO_DEFAULT, **kwargs)
38293829
if _pass_through(data):
38303830
return data[self.idx]
38313831
return _SubTensorDict(data, self.idx)
3832-
return self._source._get_at_str(key, self.idx, default=default)
3832+
return self._source._get_at_str(key, self.idx, default=default, **kwargs)
38333833

3834-
def _get_tuple(self, key, default):
3835-
return self._source._get_at_tuple(key, self.idx, default=default)
3834+
def _get_tuple(self, key, default, **kwargs):
3835+
return self._source._get_at_tuple(key, self.idx, default=default, **kwargs)
38363836

38373837
@lock_blocked
38383838
def update(

tensordict/base.py

Lines changed: 15 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -6436,6 +6436,9 @@ def get(self, key: NestedKey, *args, **kwargs) -> CompatibleType:
64366436
To adopt the old behavior, set the environment variable `export TD_GET_DEFAULTS_TO_NONE='0'` or call
64376437
:func:`~tensordict.set_get_defaults_to_none(False)`.
64386438

6439+
.. note:: Keyword arguments can be passed to :meth:`~.get` when dealing with ragged tensors.
6440+
See :meth:`~tensordict.LazyStackedTensorDict.get` for a complete overview.
6441+
64396442
Examples:
64406443
>>> td = TensorDict({"x": 1}, batch_size=[])
64416444
>>> td.get("x")
@@ -6449,26 +6452,28 @@ def get(self, key: NestedKey, *args, **kwargs) -> CompatibleType:
64496452
# Find what the default is
64506453
if args:
64516454
default = args[0]
6452-
if len(args) > 1 or kwargs:
6453-
raise TypeError("only one (keyword) argument is allowed.")
6454-
elif kwargs:
6455+
if len(args) > 1:
6456+
raise TypeError("Only one arg is allowed in TD.get.")
6457+
elif "default" in kwargs:
6458+
raise TypeError("'default' arg was passed twice.")
6459+
elif "default" in kwargs:
64556460
default = kwargs.pop("default")
6456-
if args or kwargs:
6457-
raise TypeError("only one (keyword) argument is allowed.")
6461+
if args:
6462+
raise TypeError("'default' arg was passed twice.")
64586463
elif _GET_DEFAULTS_TO_NONE:
64596464
default = None
64606465
else:
64616466
default = NO_DEFAULT
6462-
return self._get_tuple(key, default=default)
6467+
return self._get_tuple(key, default=default, **kwargs)
64636468

64646469
@abc.abstractmethod
6465-
def _get_str(self, key, default): ...
6470+
def _get_str(self, key, default, **kwargs): ...
64666471

64676472
@abc.abstractmethod
6468-
def _get_tuple(self, key, default): ...
6473+
def _get_tuple(self, key, default, **kwargs): ...
64696474

6470-
def _get_tuple_maybe_non_tensor(self, key, default):
6471-
result = self._get_tuple(key, default)
6475+
def _get_tuple_maybe_non_tensor(self, key, default, **kwargs):
6476+
result = self._get_tuple(key, default, **kwargs)
64726477
if _pass_through(result):
64736478
# Only lazy stacks of non tensors are actually tensordict instances
64746479
if isinstance(result, TensorDictBase):

tensordict/nn/common.py

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -851,6 +851,9 @@ class TensorDictModule(TensorDictModuleBase):
851851
method_kwargs (Dict[str, Any], optional): additional keyword arguments to be passed to the module's method being called.
852852
strict (bool, optional): if ``True``, the module will raise an exception if any of the inputs is missing from
853853
the input tensordict. Otherwise, a `None` value will be used as placeholder. Defaults to ``False``.
854+
get_kwargs (dict[str, Any], optional): additional keyword arguments to be passed to the :meth:`~tensordict.TensorDictBase.get`
855+
method. This is particularly useful when dealing with ragged tensors (see :meth:`~tensordict.LazyStackedTensorDict.get`).
856+
Defaults to ``{}``.
854857
855858
Embedding a neural network in a TensorDictModule only requires to specify the input
856859
and output keys. TensorDictModule support functional and regular :obj:`nn.Module`
@@ -1018,6 +1021,7 @@ def __init__(
10181021
method: str | None = None,
10191022
method_kwargs: dict | None = None,
10201023
strict: bool = False,
1024+
get_kwargs: dict | None = None,
10211025
) -> None:
10221026
super().__init__()
10231027

@@ -1097,6 +1101,7 @@ def __init__(
10971101
self.inplace = inplace
10981102
self.method = method
10991103
self.method_kwargs = method_kwargs if method_kwargs is not None else {}
1104+
self._get_kwargs = get_kwargs if get_kwargs is not None else {}
11001105

11011106
@property
11021107
def is_functional(self) -> bool:
@@ -1180,7 +1185,9 @@ def forward(
11801185
else:
11811186
tensors = tuple(
11821187
tensordict._get_tuple_maybe_non_tensor(
1183-
_unravel_key_to_tuple(in_key), default
1188+
_unravel_key_to_tuple(in_key),
1189+
default,
1190+
**self._get_kwargs,
11841191
)
11851192
for in_key in self.in_keys
11861193
)
@@ -1223,7 +1230,7 @@ def forward(
12231230
import inspect
12241231

12251232
module = inspect.getsource(module)
1226-
except OSError:
1233+
except Exception:
12271234
# then we can't print the source code
12281235
pass
12291236
module = indent(str(module), 4 * " ")

tensordict/nn/probabilistic.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -984,6 +984,14 @@ def __init__(
984984
self._ordered_dict = True
985985
else:
986986
modules = modules_list = list(modules[0])
987+
elif len(modules) == 1 and isinstance(modules[0], dict):
988+
modules = [collections.OrderedDict(modules[0])]
989+
return self.__init__(
990+
*modules,
991+
partial_tolerant=partial_tolerant,
992+
return_composite=return_composite,
993+
inplace=inplace,
994+
)
987995
elif not return_composite and not isinstance(
988996
modules[-1],
989997
(ProbabilisticTensorDictModule, ProbabilisticTensorDictSequential),

tensordict/persistent.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -354,7 +354,7 @@ def _process_array(self, key, array):
354354
return out
355355

356356
@cache # noqa: B019
357-
def _get_str(self, key: NestedKey, default):
357+
def _get_str(self, key: NestedKey, default, **kwargs):
358358
key = _unravel_key_to_tuple(key)
359359
array = self._get_array(key, default)
360360
if array is default:

0 commit comments

Comments
 (0)