[Quality] non_blocking_pin instead of pin_memory #915

Merged Jul 24, 2024 · 2 commits
12 changes: 6 additions & 6 deletions tensordict/base.py
@@ -9233,15 +9233,15 @@ def to(self, *args, **kwargs) -> T:
                 a dtype, the dtype is gathered from the example leaves.
                 If there are more than one dtype, then no dtype
                 casting is undertook.
-            pin_memory (bool, optional): if ``True``, the tensors are pinned before
+            non_blocking_pin (bool, optional): if ``True``, the tensors are pinned before
                 being sent to device. This will be done asynchronously but can be
                 controlled via the ``num_threads`` argument.
 
                 .. note:: Calling ``tensordict.pin_memory().to("cuda")`` will usually
-                    be much slower than ``tensordict.to("cuda", pin_memory=True)`` as
+                    be much slower than ``tensordict.to("cuda", non_blocking_pin=True)`` as
                     the pin_memory is called asynchronously in the second case.
 
-            num_threads (int or None, optional): if ``pin_memory=True``, the number
+            num_threads (int or None, optional): if ``non_blocking_pin=True``, the number
                 of threads to be used for ``pin_memory``. By default, multithreading
                 will be used with ``num_threads=None`` in
                 :meth:`~concurrent.futures.ThreadPoolExecutor(max_workers=None)`, which will
@@ -9269,7 +9269,7 @@ def to(self, *args, **kwargs) -> T:
             _,
             convert_to_format,
             batch_size,
-            pin_memory,
+            non_blocking_pin,
             num_threads,
         ) = _parse_to(*args, **kwargs)
         result = self
@@ -9302,7 +9302,7 @@ def to(tensor):
 
         apply_kwargs = {}
         if device is not None or dtype is not None:
-            if pin_memory and num_threads != 0:
+            if non_blocking_pin and num_threads != 0:
                 result = self._multithread_apply_nest(
                     lambda x: x.pin_memory(),
                     num_threads=num_threads,
@@ -9311,7 +9311,7 @@ def to(tensor):
                     checked=True,
                 )
             else:
-                if pin_memory:
+                if non_blocking_pin:
                     result = result.pin_memory()
             apply_kwargs["device"] = device if device is not None else self.device
             apply_kwargs["batch_size"] = batch_size
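For reference, a minimal usage sketch of the renamed keyword as documented above (not part of the diff; it assumes a CUDA device is available, and the shapes and key names are illustrative):

    import torch
    from tensordict import TensorDict

    td = TensorDict(
        {"obs": torch.randn(128, 3, 84, 84), "reward": torch.randn(128, 1)},
        batch_size=[128],
    )

    if torch.cuda.is_available():
        # Pin the leaves asynchronously across worker threads, then copy to CUDA;
        # per the docstring above this is usually faster than td.pin_memory().to("cuda").
        td_cuda = td.to("cuda", non_blocking_pin=True, num_threads=4)
        # num_threads=0 falls back to a plain, single-threaded pin_memory() call.
        td_cuda_serial = td.to("cuda", non_blocking_pin=True, num_threads=0)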
6 changes: 3 additions & 3 deletions tensordict/persistent.py
@@ -973,12 +973,12 @@ def to(self, *args, **kwargs: Any) -> PersistentTensorDict:
             non_blocking,
             convert_to_format,
             batch_size,
-            pin_memory,
+            non_blocking_pin,
             num_threads,
         ) = _parse_to(*args, **kwargs)
-        if pin_memory:
+        if non_blocking_pin:
             raise RuntimeError(
-                f"Cannot call pin_memory {type(self).__name__}.to(). Call "
+                f"Cannot use non_blocking_pin=True {type(self).__name__}.to(). Call "
                 f"`to_tensordict()` before executing this code."
             )
         result = self
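A hedged sketch of the guard above and its suggested workaround (not part of the diff). A PersistentTensorDict is HDF5-backed, so its leaves cannot be pinned in place; the file name below is hypothetical and a CUDA device is assumed:

    from tensordict.persistent import PersistentTensorDict

    data = PersistentTensorDict.from_h5("data.h5")  # hypothetical HDF5 file

    try:
        data.to("cuda", non_blocking_pin=True)  # raises RuntimeError per the guard above
    except RuntimeError:
        # Materialize the data in memory first, then pin and transfer.
        data_cuda = data.to_tensordict().to("cuda", non_blocking_pin=True)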
43 changes: 2 additions & 41 deletions tensordict/utils.py
@@ -1214,45 +1214,6 @@ def new_func(self, *args, **kwargs):
     return new_func
 
 
-# class as_decorator:
-#     """Converts a method to a decorator.
-#
-#     Examples:
-#         >>> from tensordict import TensorDict
-#         >>> data = TensorDict({}, [])
-#         >>> with data.lock_():  # lock_ is decorated
-#         ...     assert data.is_locked
-#         >>> assert not data.is_locked
-#     """
-#
-#     def __init__(self, attr=None):
-#         self.attr = attr
-#
-#     def __call__(self, func):
-#         if self.attr is not None:
-#
-#             @wraps(func)
-#             def new_func(_self, *args, **kwargs):
-#                 _attr_pre = getattr(_self, self.attr)
-#                 out = func(_self, *args, **kwargs)
-#                 _attr_post = getattr(_self, self.attr)
-#                 if out is not None:
-#                     if _attr_post is not _attr_pre:
-#                         out._last_op = (new_func.__name__, (args, kwargs, _self))
-#                     else:
-#                         out._last_op = None
-#                 return out
-#
-#         else:
-#
-#             @wraps(func)
-#             def new_func(_self, *args, **kwargs):
-#                 out = func(_self, *args, **kwargs)
-#                 if out is not None:
-#                     out._last_op = (new_func.__name__, (args, kwargs, _self))
-#                 return out
-#
-#         return new_func
 def _as_context_manager(attr=None):
     """Converts a method to a decorator.
 
@@ -1401,7 +1362,7 @@ def _split_generator():
 
 def _parse_to(*args, **kwargs):
     batch_size = kwargs.pop("batch_size", None)
-    pin_memory = kwargs.pop("pin_memory", False)
+    non_blocking_pin = kwargs.pop("non_blocking_pin", False)
     num_threads = kwargs.pop("num_threads", None)
     other = kwargs.pop("other", None)
     if not torch.compiler.is_dynamo_compiling():
@@ -1440,7 +1401,7 @@ def _parse_to(*args, **kwargs):
         non_blocking,
         convert_to_format,
         batch_size,
-        pin_memory,
+        non_blocking_pin,
         num_threads,
     )
 
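For readers unfamiliar with _parse_to, a simplified, hypothetical stand-in (not the library's actual implementation) showing the kwargs-popping pattern above; the real helper also handles other, convert_to_format and dynamo compilation:

    import torch

    def parse_to_sketch(*args, **kwargs):
        # Peel off tensordict-specific options before the Tensor.to-style arguments.
        batch_size = kwargs.pop("batch_size", None)
        non_blocking_pin = kwargs.pop("non_blocking_pin", False)  # renamed from pin_memory
        num_threads = kwargs.pop("num_threads", None)
        non_blocking = kwargs.pop("non_blocking", False)
        device = dtype = None
        for arg in args:
            if isinstance(arg, torch.dtype):
                dtype = arg
            elif arg is not None:
                device = torch.device(arg)
        return device, dtype, non_blocking, batch_size, non_blocking_pin, num_threads

    # Example: parse_to_sketch("cuda", torch.float16, non_blocking_pin=True, num_threads=4)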
31 changes: 20 additions & 11 deletions test/test_tensordict.py
@@ -3035,30 +3035,39 @@ def test_cache(self, td_name, device, op):
     )
     @pytest.mark.parametrize("device_cast", get_available_devices())
     @pytest.mark.parametrize(
-        "pin_memory", [False] if not torch.cuda.is_available() else [False, True]
+        "non_blocking_pin", [False] if not torch.cuda.is_available() else [False, True]
     )
     @pytest.mark.parametrize("num_threads", [0, 1, 4, None])
-    def test_cast_device(self, td_name, device, device_cast, pin_memory, num_threads):
+    def test_cast_device(
+        self, td_name, device, device_cast, non_blocking_pin, num_threads
+    ):
         torch.manual_seed(1)
         td = getattr(self, td_name)(device)
-        if pin_memory and td_name == "td_h5":
+        if non_blocking_pin and td_name == "td_h5":
             with pytest.raises(
-                RuntimeError, match="Cannot call pin_memory PersistentTensorDict.to()"
+                RuntimeError,
+                match="Cannot use non_blocking_pin=True PersistentTensorDict.to()",
             ):
                 td_device = td.to(
-                    device_cast, pin_memory=pin_memory, num_threads=num_threads
+                    device_cast,
+                    non_blocking_pin=non_blocking_pin,
+                    num_threads=num_threads,
                 )
             return
 
-        if device.type == "cuda" and device_cast.type == "cpu" and pin_memory:
+        if device.type == "cuda" and device_cast.type == "cpu" and non_blocking_pin:
             with pytest.raises(
                 RuntimeError, match="only dense CPU tensors can be pinned"
             ):
                 td_device = td.to(
-                    device_cast, pin_memory=pin_memory, num_threads=num_threads
+                    device_cast,
+                    non_blocking_pin=non_blocking_pin,
+                    num_threads=num_threads,
                 )
             return
-        td_device = td.to(device_cast, pin_memory=pin_memory, num_threads=num_threads)
+        td_device = td.to(
+            device_cast, non_blocking_pin=non_blocking_pin, num_threads=num_threads
+        )
 
         for item in td_device.values():
             assert item.device == device_cast
@@ -8606,16 +8615,16 @@ def test_subtd(self):
 
     @pytest.mark.parametrize("device", get_available_devices())
     @pytest.mark.parametrize(
-        "pin_memory", [False] if not torch.cuda.is_available() else [False, True]
+        "non_blocking_pin", [False] if not torch.cuda.is_available() else [False, True]
    )
     @pytest.mark.parametrize("num_threads", [0, 1, 4, None])
-    def test_to(self, device, pin_memory, num_threads):
+    def test_to(self, device, non_blocking_pin, num_threads):
         td = TensorDict(
             {"": TensorDict({}, [3, 4, 1, 6])},
             batch_size=[3, 4, 1, 6],
             names=["a", "b", "c", "d"],
         )
-        tdt = td.to(device, pin_memory=pin_memory, num_threads=num_threads)
+        tdt = td.to(device, non_blocking_pin=non_blocking_pin, num_threads=num_threads)
         assert tdt.names == ["a", "b", "c", "d"]
 
     def test_unbind(self):
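For completeness (not part of the diff), the behavior checked by test_to above can be reproduced standalone; a minimal sketch that only needs a CPU device:

    from tensordict import TensorDict

    td = TensorDict(
        {"": TensorDict({}, [3, 4, 1, 6])},
        batch_size=[3, 4, 1, 6],
        names=["a", "b", "c", "d"],
    )
    # The renamed keyword is accepted with the default False and dimension names survive .to().
    tdt = td.to("cpu", non_blocking_pin=False, num_threads=None)
    assert tdt.names == ["a", "b", "c", "d"]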