[Feature] broadcast tensordicts

Vincent Moens · Vincent Moens · commit 29598633e9ee · 2025-05-02T10:58:18.000+01:00
ghstack-source-id: 3b142c9 Pull-Request-resolved: #1307
diff --git a/tensordict/_reductions.py b/tensordict/_reductions.py
@@ -12,7 +12,7 @@
 from tensordict._td import TensorDict
 
 from tensordict.tensorclass import NonTensorData, NonTensorStack
-from tensordict.utils import _is_tensorclass, _STRDTYPE2DTYPE
+from tensordict.utils import _is_tensorclass, _STR_DTYPE_TO_DTYPE
 
 CLS_MAP = {
     "TensorDict": TensorDict,
@@ -99,7 +99,7 @@ def from_metadata(metadata=metadata, prefix=None):
             for (key, (data, batch_size, device)) in non_tensor.items()
         }
         for key, (dtype, local_shape, start, stop, pad) in leaves.items():
-            dtype = _STRDTYPE2DTYPE[dtype]
+            dtype = _STR_DTYPE_TO_DTYPE[dtype]
             # device = torch.device(device)
             local_shape = torch.Size(local_shape)
             value = storage[start:stop].view(dtype)
diff --git a/tensordict/_td.py b/tensordict/_td.py
@@ -67,7 +67,7 @@
     _set_item,
     _set_max_batch_size,
     _shape,
-    _STRDTYPE2DTYPE,
+    _STR_DTYPE_TO_DTYPE,
     _StringKeys,
     _StringOnlyDict,
     _sub_index,
@@ -2836,7 +2836,7 @@ def _load_memmap(
                 else:
                     shape = torch.Size(shape)
                 tensor = MemoryMappedTensor.from_filename(
-                    dtype=_STRDTYPE2DTYPE[dtype],
+                    dtype=_STR_DTYPE_TO_DTYPE[dtype],
                     shape=shape,
                     filename=str(prefix / f"{key}.memmap"),
                 )
@@ -2846,7 +2846,7 @@ def _load_memmap(
                 tensor = torch.zeros(
                     torch.Size(shape),
                     device=device,
-                    dtype=_STRDTYPE2DTYPE[dtype],
+                    dtype=_STR_DTYPE_TO_DTYPE[dtype],
                 )
             result._set_str(
                 key,
diff --git a/tensordict/base.py b/tensordict/base.py
@@ -56,7 +56,7 @@
     _as_context_manager,
     _CloudpickleWrapper,
     _convert_list_to_stack,
-    _DTYPE2STRDTYPE,
+    _DTYPE_TO_STR_DTYPE,
     _GENERIC_NESTED_ERR,
     _is_dataclass as is_dataclass,
     _is_list_tensor_compatible,
@@ -79,6 +79,7 @@
     _set_max_batch_size,
     _shape,
     _split_tensordict,
+    _STR_DTYPE_TO_DTYPE,
     _td_fields,
     _unravel_key_to_tuple,
     _zip_strict,
@@ -5061,7 +5062,7 @@ def add_single_value(value, key, metadata_dict, dtype, shape, flat_size):
             stop = sum([start, flat_size[-1]])
             if requires_metadata:
                 metadata_dict["leaves"][key] = (
-                    _DTYPE2STRDTYPE[dtype],
+                    _DTYPE_TO_STR_DTYPE[dtype],
                     list(shape),
                     # _DEVICE2STRDEVICE[device],
                     start,
@@ -7953,11 +7954,161 @@ def _recv(
 
         return _tag
 
+    def init_remote(
+        self,
+        dst: int,
+        group: "ProcessGroup" | None = None,  # noqa: F821
+        device: torch.device | None = None,
+    ):
+        """Initializes a remote tensordict by sending its metadata and content.
+
+        This method sends the metadata of the current tensordict (the shape, dtype and device of each leaf, plus the batch-size, device and lock status) to the specified destination rank (`dst`).
+
+        It then sends the actual tensordict content through :meth:`~.isend`.
+
+        Args:
+            dst (int): The rank of the destination process.
+            group ("ProcessGroup", optional): The process group to use for communication. Defaults to None.
+            device (torch.device, optional): The device passed to ``torch.distributed.send_object_list`` when sending the metadata. Defaults to None.
+
+        .. seealso::
+            The receiving process should call :meth:`~.from_remote_init` or an equivalent method to receive and initialize a new tensordict based on the sent metadata.
+
+        Examples:
+            >>> import os
+            >>> import torch
+            >>> import torch.distributed as dist
+            >>> from tensordict import TensorDict, MemoryMappedTensor
+            >>> import multiprocessing as mp
+            >>>
+            >>> def server(queue):
+            ...     # Set environment variables for distributed communication
+            ...     os.environ["MASTER_ADDR"] = "localhost"
+            ...     os.environ["MASTER_PORT"] = "29505"
+            ...
+            ...     # Initialize the distributed backend
+            ...     dist.init_process_group("gloo", rank=0, world_size=2)
+            ...
+            ...     # Create a sample tensordict
+            ...     td = (
+            ...         TensorDict(
+            ...             {
+            ...                 ("a", "b"): torch.ones(2),
+            ...                 "c": torch.ones(2),
+            ...                 ("d", "e", "f"): MemoryMappedTensor.from_tensor(torch.ones(2, 2)),
+            ...             },
+            ...             [2],
+            ...         )
+            ...         .expand(1, 2)
+            ...         .contiguous()
+            ...     )
+            ...
+            ...     # Send the tensordict metadata and content to the client
+            ...     td.init_remote(dst=1)
+            ...
+            >>> def client(queue):
+            ...     # Set environment variables for distributed communication
+            ...     os.environ["MASTER_ADDR"] = "localhost"
+            ...     os.environ["MASTER_PORT"] = "29505"
+            ...
+            ...     # Initialize the distributed backend
+            ...     dist.init_process_group("gloo", rank=1, world_size=2)
+            ...
+            ...     # Receive the tensordict metadata and content from the server
+            ...     received_td = TensorDict.from_remote_init(src=0)
+            ...
+            ...     # Verify that the received tensordict matches the expected structure and values
+            ...     assert set(received_td.keys()) == {"a", "c", "d"}
+            ...     assert (received_td == 1).all()
+            ...
+            ...     # Signal that the test has completed successfully
+            ...     queue.put("yuppie")
+            >>>
+            >>> if __name__ == "__main__":
+            ...     queue = mp.Queue(1)
+            ...
+            ...     # Create and start the server and client processes
+            ...     main_worker = mp.Process(target=server, args=(queue,))
+            ...     secondary_worker = mp.Process(target=client, args=(queue,))
+            ...
+            ...     main_worker.start()
+            ...     secondary_worker.start()
+            ...
+            ...     try:
+            ...         out = queue.get(timeout=10)  # Wait for the signal with a timeout
+            ...         print(out)  # Should print "yuppie"
+            ...     finally:
+            ...         queue.close()
+            ...         main_worker.join(timeout=10)
+            ...         secondary_worker.join(timeout=10)
+        """
+        # Metadata payload: per-leaf (shape, dtype, device) specs, batch-size, device and lock status
+        data = [
+            {
+                k: (tuple(val.shape), str(val.dtype), str(val.device))
+                for k, val in self.items(True, True)
+            },
+            self.batch_size,
+            self.device,
+            self.is_locked,
+        ]
+        torch.distributed.send_object_list(
+            data,
+            dst=dst,
+            group=group,
+            device=device,
+        )
+        self.isend(dst, group=group)  # the tensor content follows the metadata
+
+    @classmethod
+    def from_remote_init(
+        cls: T,
+        src: int,
+        group: "ProcessGroup" | None = None,  # noqa: F821
+        device: torch.device | None = None,
+    ) -> T:
+        """Creates a new tensordict instance initialized from remotely sent metadata.
+
+        This class method receives the metadata sent by :meth:`~.init_remote`, creates a new tensordict with matching shape and dtype,
+        and then receives the actual tensordict content through :meth:`~.irecv`.
+
+        Args:
+            src (int): The rank of the source process that sent the metadata.
+            group ("ProcessGroup", optional): The process group to use for communication. Defaults to None.
+            device (torch.device, optional): The device passed to ``torch.distributed.recv_object_list`` when receiving the metadata; the tensors themselves are allocated on the devices recorded in that metadata. Defaults to None.
+
+        Returns:
+            TensorDict: A new tensordict instance initialized with the received metadata and content.
+
+        .. seealso::
+            The sending process should have called :meth:`~.init_remote` to send the metadata and content.
+        """
+        data = [None, None, None, None]  # slots: leaf specs, batch_size, device, is_locked
+        torch.distributed.recv_object_list(
+            data,
+            src=src,
+            group=group,
+            device=device,
+        )
+        metadata = data[0]
+        td = cls(
+            {
+                k: torch.empty(v[0], dtype=_STR_DTYPE_TO_DTYPE[v[1]], device=v[2])
+                for k, v in metadata.items()
+            },
+            batch_size=data[1],
+            device=data[2],
+        )
+        if data[3]:  # the sender reported a locked tensordict
+            td.lock_()
+        td.irecv(src=src, group=group)
+        return td
+
     def isend(
         self,
         dst: int,
         *,
-        group: "torch.distributed.ProcessGroup" | None = None,
+        group: "torch.distributed.ProcessGroup" | None = None,   # noqa: F821
         init_tag: int = 0,
         pseudo_rand: bool = False,
         return_early: bool = False,
@@ -8048,7 +8199,13 @@ def isend(
             ...     secondary_worker.join()
 
         """
-        return self._isend(dst, _tag=init_tag - 1, pseudo_rand=pseudo_rand, group=group, return_early=return_early)
+        return self._isend(
+            dst,
+            _tag=init_tag - 1,
+            pseudo_rand=pseudo_rand,
+            group=group,
+            return_early=return_early,
+        )
 
     def _isend(
         self,
@@ -8057,7 +8214,7 @@ def _isend(
         _futures: list[torch.Future] | None = None,
         pseudo_rand: bool = False,
         group: "torch.distributed.ProcessGroup" | None = None,
-            return_early: bool = False,
+        return_early: bool = False,
     ) -> int:
         from torch import distributed as dist
 
diff --git a/tensordict/tensorclass.pyi b/tensordict/tensorclass.pyi
@@ -704,6 +704,20 @@ class TensorClass:
         init_tag: int = 0,
         pseudo_rand: bool = False,
     ) -> int: ...
+    # Stubs for the ``init_remote`` / ``from_remote_init`` methods added in tensordict/base.py.
+    def init_remote(
+        self,
+        dst: int,
+        group: "ProcessGroup" | None = None,
+        device: torch.device | None = None,
+    ): ...
+    @classmethod
+    def from_remote_init(
+        cls,
+        src: int,
+        group: "ProcessGroup" | None = None,
+        device: torch.device | None = None,
+    ): ...
     def isend(
         self,
         dst: int,
diff --git a/tensordict/utils.py b/tensordict/utils.py
@@ -147,8 +147,10 @@ def dims(self, *args, **kwargs):
     _TORCH_DTYPES = _TORCH_DTYPES + (torch.uint32,)
 if hasattr(torch, "uint64"):
     _TORCH_DTYPES = _TORCH_DTYPES + (torch.uint64,)
-_STRDTYPE2DTYPE = {str(dtype): dtype for dtype in _TORCH_DTYPES}
-_DTYPE2STRDTYPE = {dtype: str_dtype for str_dtype, dtype in _STRDTYPE2DTYPE.items()}
+_STR_DTYPE_TO_DTYPE = {str(dtype): dtype for dtype in _TORCH_DTYPES}
+_DTYPE_TO_STR_DTYPE = {
+    dtype: str_dtype for str_dtype, dtype in _STR_DTYPE_TO_DTYPE.items()
+}
 
 IndexType = Union[None, int, slice, str, Tensor, List[Any], Tuple[Any, ...]]
 DeviceType = Union[torch.device, str, int]
diff --git a/test/test_distributed.py b/test/test_distributed.py
@@ -761,6 +761,75 @@ def make_td(ones):
         return td
 
 
+class TestInitRemote:
+    """Round-trip test for ``init_remote`` / ``from_remote_init`` over gloo."""
+
+    # Rendezvous port shared by the server and client processes.
+    port = "29505"
+
+    @classmethod
+    def client(cls, queue, rank):
+        """Receive the tensordict from rank 0, check it, then signal success."""
+        os.environ["MASTER_ADDR"] = "localhost"
+        os.environ["MASTER_PORT"] = cls.port
+        dist.init_process_group(
+            "gloo",
+            rank=rank,
+            world_size=2,
+        )
+
+        td = TensorDict.from_remote_init(src=0)
+        assert set(td.keys()) == {"a", "c", "d"}
+        assert (td == 1).all()
+        queue.put("yuppie")
+
+    @classmethod
+    def server(cls, queue):
+        """Build a nested tensordict of ones as rank 0 and send it to rank 1."""
+        os.environ["MASTER_ADDR"] = "localhost"
+        os.environ["MASTER_PORT"] = cls.port
+        dist.init_process_group(
+            "gloo",
+            rank=0,
+            world_size=2,
+        )
+
+        td = (
+            TensorDict(
+                {
+                    ("a", "b"): torch.ones(2),
+                    "c": torch.ones(2),
+                    ("d", "e", "f"): MemoryMappedTensor.from_tensor(torch.ones(2, 2)),
+                },
+                [2],
+            )
+            .expand(1, 2)
+            .contiguous()
+        )
+        td.init_remote(dst=1)
+
+    def test_init_remote(self, set_context, tmp_path):
+        """Run both ranks in subprocesses and wait for the client's signal."""
+        queue = mp.Queue(1)
+        main_worker = mp.Process(target=type(self).server, args=(queue,))
+        secondary_worker = mp.Process(target=type(self).client, args=(queue, 1))
+
+        main_worker.start()
+        secondary_worker.start()
+        try:
+            # A timeout surfaces as ``queue.Empty`` rather than a masked assert.
+            out = queue.get(timeout=TIMEOUT)
+            assert out == "yuppie"
+        finally:
+            queue.close()
+            for worker in (main_worker, secondary_worker):
+                worker.join(timeout=TIMEOUT)
+                if worker.is_alive():
+                    # Do not leave a hung rank holding the rendezvous port.
+                    worker.terminate()
+                    worker.join()
+
+
 if __name__ == "__main__":
     args, unknown = argparse.ArgumentParser().parse_known_args()
     pytest.main([__file__, "--capture", "no", "--exitfirst"] + unknown)