[Feature] History.default_spec

Vincent Moens · Vincent Moens · commit 8ce11a859bb7 · 2025-04-07T15:39:10.000+01:00
ghstack-source-id: 40b8a49 Pull Request resolved: #2894
diff --git a/test/test_cost.py b/test/test_cost.py
@@ -16676,6 +16676,9 @@ def forward(self, td, mode):
 
 
 class TestPPO4LLMs:
+    @pytest.mark.skipif(
+        not _has_transformers, reason="transformers lib required to test PPO with LLMs"
+    )
     @set_capture_non_tensor_stack(False)
     @pytest.mark.parametrize("from_text", [True, False])
     def test_hf(self, from_text):
diff --git a/test/test_rb.py b/test/test_rb.py
@@ -4097,6 +4097,22 @@ def test_history_template_recover(self, mock_history, tokenizer):
         )
         recovered = history._inv_chatml(tokenizer.batch_decode(data_token)[0])
 
+    def test_history_spec(self):
+        """Check that the default spec produces History data and contains a real History."""
+        roles = ["system", "user", "assistant", "user"]
+        contents = [
+            "i'm the system",
+            "i'm the user",
+            "I'm the assistant",
+            "I'm the user again",
+        ]
+        history = History(role=roles, content=contents)
+        spec = history.default_spec()
+        # A sample drawn from the spec must keep the History data class.
+        zeroed = spec.zero()
+        assert isinstance(zeroed, History)
+        # Both the generated sample and the hand-built history must belong to the spec.
+        assert spec.is_in(zeroed)
+        assert spec.is_in(history)
+
 
 if __name__ == "__main__":
     args, unknown = argparse.ArgumentParser().parse_known_args()
diff --git a/torchrl/data/llm/chat.py b/torchrl/data/llm/chat.py
@@ -4,7 +4,10 @@
 # LICENSE file in the root directory of this source tree.
 from __future__ import annotations
 
+import dataclasses
+
 import re
+from typing import Literal
 
 import torch
 
@@ -107,10 +110,11 @@ def apply_chat_template(
         padding: bool | str = False,
         truncation: bool | str = False,
         return_tensors: str | None = "pt",
+        **kwargs,
     ):
         """Applies a chat template to the history.
 
-        Args:
+        Keyword Args:
             tokenizer (transformers.PreTrainedTokenizer): The tokenizer to use.
             add_generation_prompt (bool, optional): Whether to add a generation prompt. Defaults to True.
             chat_template (str, optional): The chat template to use. Defaults to _TEMPLATES["chatml_format"].
@@ -119,6 +123,7 @@ def apply_chat_template(
             padding (bool | str, optional): The padding strategy to use. Defaults to False.
             truncation (bool | str, optional): The truncation strategy to use. Defaults to False.
             return_tensors (str | None, optional): The type of tensors to return. Defaults to "pt".
+            **kwargs: Additional keyword arguments to pass to the tokenizer `apply_chat_template` method.
 
         Returns:
             The formatted history.
@@ -135,6 +140,17 @@ def apply_chat_template(
             continue_final_message=continue_final_message,
         )
 
+    @classmethod
+    def inv_chat_template(
+        cls, text: str, chat_template_name: Literal["chatml_format"] = "chatml_format"
+    ) -> History:
+        """Inverts a chat-template-formatted string into a History object.
+
+        Args:
+            text (str): The formatted text to invert.
+            chat_template_name (str, optional): The name of the chat template that produced ``text``.
+                Only ``"chatml_format"`` is accepted for now. Defaults to ``"chatml_format"``.
+
+        Returns:
+            History: The output of ``cls._inv_chatml(text)``.
+
+        Raises:
+            NotImplementedError: If ``chat_template_name`` is anything other than ``"chatml_format"``.
+        """
+        # Hard coded for now: only the chatml inverse is dispatched from here.
+        if chat_template_name == "chatml_format":
+            return cls._inv_chatml(text)
+        raise NotImplementedError(
+            "chat_template_name must be one of ('chatml_format',)"
+        )
+
     @classmethod
     def _inv_chatml(cls, text: str) -> History:
         """Inverts a chatml string into a History object.
@@ -227,3 +243,64 @@ def extend(
                 self.__dict__["_tensordict"] = td
                 return self
         return torch.stack(list(self.unbind(dim)) + list(history.unbind(dim)), dim=dim)
+
+    @classmethod
+    def default_spec(cls, shape=(-1,)):
+        """A default spec to use in transforms / envs that return History objects.
+
+        Args:
+            shape (torch.Size, optional): The shape of the returned History spec and of each of its entries.
+                Defaults to `(-1,)` (variable length along time dimension).
+
+        Returns:
+            Composite: A spec with one ``NonTensor`` entry per dataclass field of ``cls`` and ``cls`` as its
+            data class.
+
+        Example:
+            >>> import tensordict
+            >>> from torchrl.data import History
+            >>> tensordict.set_list_to_stack(True).set()
+            >>>
+            >>> history = History(role=["system", "user"], content=["a message", "another message"], batch_size=(2,))
+            >>> spec = history.default_spec()
+            >>> print(spec)
+            Composite(
+                role: NonTensor(
+                    shape=torch.Size([-1]),
+                    space=None,
+                    device=None,
+                    dtype=None,
+                    domain=None,
+                    example_data=foo),
+                content: NonTensor(
+                    shape=torch.Size([-1]),
+                    space=None,
+                    device=None,
+                    dtype=None,
+                    domain=None,
+                    example_data=foo),
+                device=None,
+                shape=torch.Size([-1]))
+            >>> print(spec.zero())
+            History(
+                content=NonTensorData(data=foo, batch_size=torch.Size([1]), device=None),
+                role=NonTensorData(data=foo, batch_size=torch.Size([1]), device=None),
+                batch_size=torch.Size([1]),
+                device=None,
+                is_shared=False)
+
+        """
+        # Imported lazily, inside the method, as in the original implementation.
+        from torchrl.data import Composite, NonTensor
+
+        def get_default_value(field):
+            # A default declared on the dataclass field is used as-is.
+            if field.default is not dataclasses.MISSING:
+                return field.default
+            # With `from __future__ import annotations` the annotation may be the
+            # string "str" rather than the `str` type, hence both are checked.
+            elif field.type in (str, "str"):
+                return "foo"
+            else:
+                return None
+
+        # Every leaf takes the requested shape so that it agrees with the shape of
+        # the enclosing Composite. It was previously hard-coded to (-1,), which only
+        # matched the default value of `shape`.
+        defaults = {
+            name: NonTensor(example_data=get_default_value(field), shape=shape)
+            for name, field in cls.__dataclass_fields__.items()
+        }
+
+        return Composite(defaults, shape=shape, data_cls=cls)