diff --git a/torchtune/datasets/_chat.py b/torchtune/datasets/_chat.py index 285793085e..751fed95a3 100644 --- a/torchtune/datasets/_chat.py +++ b/torchtune/datasets/_chat.py @@ -91,7 +91,7 @@ def _prepare_sample(self, sample: Mapping[str, Any]) -> Tuple[List[int], List[in messages = self._convert_to_messages(sample, self.train_on_input) if self.chat_format is not None: messages = self.chat_format.format(messages) - validate_messages(messages) + #validate_messages(messages) tokens, mask = self._tokenizer.tokenize_messages( messages, max_seq_len=self.max_seq_len )