[Feature] Rework to_one_hot and to_categorical to take a tensor as parameter (#816)

riiswa · web-flow · commit 099ced3f7b1f · 2023-02-20T16:36:35.000Z
diff --git a/test/test_specs.py b/test/test_specs.py
@@ -240,9 +240,9 @@ def test_mult_onehot(shape, ns):
         for _r, _n in zip(rsplit, ns):
             assert (_r.sum(-1) == 1).all()
             assert _r.shape[-1] == _n
-        np_r = ts.to_numpy(r)
-        assert not ts.is_in(torch.tensor(np_r))
-        assert (ts.encode(np_r) == r).all()
+        categorical = ts.to_categorical(r)
+        assert not ts.is_in(categorical)
+        assert (ts.encode(categorical) == r).all()
 
 
 @pytest.mark.parametrize(
@@ -327,8 +327,11 @@ def test_discrete_conversion(n, device, shape):
     one_hot = OneHotDiscreteTensorSpec(n, device=device, shape=shape_one_hot)
 
     assert categorical != one_hot
-    assert categorical.to_onehot() == one_hot
-    assert one_hot.to_categorical() == categorical
+    assert categorical.to_one_hot_spec() == one_hot
+    assert one_hot.to_categorical_spec() == categorical
+
+    assert categorical.is_in(one_hot.to_categorical(one_hot.rand(shape)))
+    assert one_hot.is_in(categorical.to_one_hot(categorical.rand(shape)))
 
 
 @pytest.mark.parametrize(
@@ -341,14 +344,24 @@ def test_discrete_conversion(n, device, shape):
         [4, 5, 1, 3],
     ],
 )
+@pytest.mark.parametrize(
+    "shape",
+    [
+        torch.Size([3]),
+        torch.Size([4, 5]),
+    ],
+)
 @pytest.mark.parametrize("device", get_available_devices())
-def test_multi_discrete_conversion(ns, device):
+def test_multi_discrete_conversion(ns, shape, device):
     categorical = MultiDiscreteTensorSpec(ns, device=device)
     one_hot = MultiOneHotDiscreteTensorSpec(ns, device=device)
 
     assert categorical != one_hot
-    assert categorical.to_onehot() == one_hot
-    assert one_hot.to_categorical() == categorical
+    assert categorical.to_one_hot_spec() == one_hot
+    assert one_hot.to_categorical_spec() == categorical
+
+    assert categorical.is_in(one_hot.to_categorical(one_hot.rand(shape)))
+    assert one_hot.is_in(categorical.to_one_hot(categorical.rand(shape)))
 
 
 @pytest.mark.parametrize("is_complete", [True, False])
@@ -1019,21 +1032,22 @@ def test_mult_discrete_action_spec_reconstruct(self):
         action_spec = MultiOneHotDiscreteTensorSpec((10, 5))
 
         actions_tensors = [action_spec.rand() for _ in range(10)]
-        actions_numpy = [action_spec.to_numpy(a) for a in actions_tensors]
-        actions_tensors_2 = [action_spec.encode(a) for a in actions_numpy]
+        actions_categorical = [action_spec.to_categorical(a) for a in actions_tensors]
+        actions_tensors_2 = [action_spec.encode(a) for a in actions_categorical]
         assert all(
             [(a1 == a2).all() for a1, a2 in zip(actions_tensors, actions_tensors_2)]
         )
 
-        actions_numpy = [
-            np.concatenate(
-                [np.random.randint(0, 10, (1,)), np.random.randint(0, 5, (1,))], 0
-            )
+        actions_categorical = [
+            torch.cat((torch.randint(0, 10, (1,)), torch.randint(0, 5, (1,))), 0)
             for a in actions_tensors
         ]
-        actions_tensors = [action_spec.encode(a) for a in actions_numpy]
-        actions_numpy_2 = [action_spec.to_numpy(a) for a in actions_tensors]
-        assert all((a1 == a2).all() for a1, a2 in zip(actions_numpy, actions_numpy_2))
+        actions_tensors = [action_spec.encode(a) for a in actions_categorical]
+        actions_categorical_2 = [action_spec.to_categorical(a) for a in actions_tensors]
+        assert all(
+            (a1 == a2).all()
+            for a1, a2 in zip(actions_categorical, actions_categorical_2)
+        )
 
     def test_one_hot_discrete_action_spec_rand(self):
         torch.manual_seed(0)
@@ -1070,14 +1084,14 @@ def test_mult_discrete_action_spec_rand(self):
         action_spec = MultiOneHotDiscreteTensorSpec((10, 5))
 
         actions_tensors = [action_spec.rand() for _ in range(10)]
-        actions_numpy = [action_spec.to_numpy(a) for a in actions_tensors]
-        actions_tensors_2 = [action_spec.encode(a) for a in actions_numpy]
+        actions_categorical = [action_spec.to_categorical(a) for a in actions_tensors]
+        actions_tensors_2 = [action_spec.encode(a) for a in actions_categorical]
         assert all(
             [(a1 == a2).all() for a1, a2 in zip(actions_tensors, actions_tensors_2)]
         )
 
-        sample = np.stack(
-            [action_spec.to_numpy(action_spec.rand()) for _ in range(N)], 0
+        sample = torch.stack(
+            [action_spec.to_categorical(action_spec.rand()) for _ in range(N)], 0
         )
         assert sample.shape[0] == N
         assert sample.shape[1] == 2
diff --git a/torchrl/data/tensor_specs.py b/torchrl/data/tensor_specs.py
@@ -618,9 +618,28 @@ def __eq__(self, other):
             and self.use_register == other.use_register
         )
 
-    def to_categorical(self) -> DiscreteTensorSpec:
+    def to_categorical(self, val: torch.Tensor, safe: bool = True) -> torch.Tensor:
+        """Converts a given one-hot tensor into categorical format.
+
+        Args:
+            val (torch.Tensor): One-hot tensor to convert into categorical format.
+            safe (bool): boolean value indicating whether a check should be
+                performed on the value against the domain of the spec.
+
+        Returns:
+            The categorical tensor.
+        """
+        if safe:
+            self.assert_is_in(val)
+        return val.argmax(-1)
+
+    def to_categorical_spec(self) -> DiscreteTensorSpec:
+        """Converts the spec to the equivalent categorical spec."""
         return DiscreteTensorSpec(
-            self.space.n, device=self.device, dtype=self.dtype, shape=self.shape[:-1]
+            self.space.n,
+            device=self.device,
+            dtype=self.dtype,
+            shape=self.shape[:-1],
         )
 
 
@@ -1184,13 +1203,6 @@ def _split(self, val: torch.Tensor) -> Optional[torch.Tensor]:
             return None
         return val.split(split_sizes, dim=-1)
 
-    def to_numpy(self, val: torch.Tensor, safe: bool = True) -> np.ndarray:
-        if safe:
-            self.assert_is_in(val)
-        vals = self._split(val)
-        out = torch.stack([val.argmax(-1) for val in vals], -1).numpy()
-        return out
-
     def index(self, index: INDEX_TYPING, tensor_to_index: torch.Tensor) -> torch.Tensor:
         if not isinstance(index, torch.Tensor):
             raise ValueError(
@@ -1219,8 +1231,24 @@ def _project(self, val: torch.Tensor) -> torch.Tensor:
         vals = self._split(val)
         return torch.cat([super()._project(_val) for _val in vals], -1)
 
-    def to_categorical(self) -> MultiDiscreteTensorSpec:
+    def to_categorical(self, val: torch.Tensor, safe: bool = True) -> torch.Tensor:
+        """Converts a given one-hot tensor into categorical format.
+
+        Args:
+            val (torch.Tensor): One-hot tensor to convert into categorical format.
+            safe (bool): boolean value indicating whether a check should be
+                performed on the value against the domain of the spec.
 
+        Returns:
+            The categorical tensor.
+        """
+        if safe:
+            self.assert_is_in(val)
+        vals = self._split(val)
+        return torch.stack([val.argmax(-1) for val in vals], -1)
+
+    def to_categorical_spec(self) -> MultiDiscreteTensorSpec:
+        """Converts the spec to the equivalent categorical spec."""
         return MultiDiscreteTensorSpec(
             [_space.n for _space in self.space],
             device=self.device,
@@ -1321,12 +1349,23 @@ def __eq__(self, other):
     def to_numpy(self, val: TensorDict, safe: bool = True) -> dict:
         return super().to_numpy(val, safe)
 
-    def to_onehot(self) -> OneHotDiscreteTensorSpec:
-        # if len(self.shape) > 1:
-        #     raise RuntimeError(
-        #         f"DiscreteTensorSpec with shape that has several dimensions can't be converted to "
-        #         f"OneHotDiscreteTensorSpec. Got shape={self.shape}."
-        #     )
+    def to_one_hot(self, val: torch.Tensor, safe: bool = True) -> torch.Tensor:
+        """Encodes a discrete tensor from the spec domain into its one-hot counterpart.
+
+        Args:
+            val (torch.Tensor): Tensor to one-hot encode.
+            safe (bool): boolean value indicating whether a check should be
+                performed on the value against the domain of the spec.
+
+        Returns:
+            The one-hot encoded tensor.
+        """
+        if safe:
+            self.assert_is_in(val)
+        return torch.nn.functional.one_hot(val, self.space.n)
+
+    def to_one_hot_spec(self) -> OneHotDiscreteTensorSpec:
+        """Converts the spec to the equivalent one-hot spec."""
         shape = [*self.shape, self.space.n]
         return OneHotDiscreteTensorSpec(
             n=self.space.n, shape=shape, device=self.device, dtype=self.dtype
@@ -1488,17 +1527,41 @@ def is_in(self, val: torch.Tensor) -> bool:
         )
         if self.dtype != val.dtype or len(self.shape) > val.ndim or val_have_wrong_dim:
             return False
+        val_device = val.device
+        return (
+            (
+                (val >= torch.zeros(self.nvec.size(), device=val_device))
+                & (val < self.nvec.to(val_device))
+            )
+            .all()
+            .item()
+        )
 
-        return ((val >= torch.zeros(self.nvec.size())) & (val < self.nvec)).all().item()
+    def to_one_hot(
+        self, val: torch.Tensor, safe: bool = True
+    ) -> Union[MultiOneHotDiscreteTensorSpec, torch.Tensor]:
+        """Encodes a discrete tensor from the spec domain into its one-hot counterpart.
 
-    def to_onehot(self) -> MultiOneHotDiscreteTensorSpec:
-        if len(self.shape) > 1:
-            raise RuntimeError(
-                f"DiscreteTensorSpec with shape that has several dimensions can't be converted to"
-                f"OneHotDiscreteTensorSpec. Got shape={self.shape}. This could be accomplished via padding or "
-                f"nestedtensors but it is not implemented yet. If you would like to see that feature, please submit "
-                f"an issue of torchrl's github repo. "
-            )
+        Args:
+            val (torch.Tensor): Tensor to one-hot encode.
+            safe (bool): boolean value indicating whether a check should be
+                performed on the value against the domain of the spec.
+
+        Returns:
+            The one-hot encoded tensor.
+        """
+        if safe:
+            self.assert_is_in(val)
+        return torch.cat(
+            [
+                torch.nn.functional.one_hot(val[..., i], n)
+                for i, n in enumerate(self.nvec)
+            ],
+            -1,
+        ).to(self.device)
+
+    def to_one_hot_spec(self) -> MultiOneHotDiscreteTensorSpec:
+        """Converts the spec to the equivalent one-hot spec."""
         nvec = [_space.n for _space in self.space]
         return MultiOneHotDiscreteTensorSpec(
             nvec,